{"current_steps": 5, "total_steps": 33920, "loss": 6.5898, "lr": 1.179245283018868e-08, "epoch": 0.00294811320754717, "percentage": 0.01, "elapsed_time": "0:00:01", "remaining_time": "2:38:49", "throughput": 2049.97, "total_tokens": 2880} {"current_steps": 10, "total_steps": 33920, "loss": 6.6231, "lr": 2.6533018867924528e-08, "epoch": 0.00589622641509434, "percentage": 0.03, "elapsed_time": "0:00:01", "remaining_time": "1:49:28", "throughput": 2957.0, "total_tokens": 5728} {"current_steps": 15, "total_steps": 33920, "loss": 6.5842, "lr": 4.127358490566038e-08, "epoch": 0.00884433962264151, "percentage": 0.04, "elapsed_time": "0:00:02", "remaining_time": "1:32:00", "throughput": 3577.12, "total_tokens": 8736} {"current_steps": 20, "total_steps": 33920, "loss": 6.5648, "lr": 5.601415094339623e-08, "epoch": 0.01179245283018868, "percentage": 0.06, "elapsed_time": "0:00:02", "remaining_time": "1:22:56", "throughput": 3967.3, "total_tokens": 11648} {"current_steps": 25, "total_steps": 33920, "loss": 6.4989, "lr": 7.075471698113208e-08, "epoch": 0.01474056603773585, "percentage": 0.07, "elapsed_time": "0:00:03", "remaining_time": "1:21:54", "throughput": 4475.65, "total_tokens": 16224} {"current_steps": 30, "total_steps": 33920, "loss": 6.7535, "lr": 8.549528301886793e-08, "epoch": 0.01768867924528302, "percentage": 0.09, "elapsed_time": "0:00:04", "remaining_time": "1:17:30", "throughput": 4648.47, "total_tokens": 19136} {"current_steps": 35, "total_steps": 33920, "loss": 6.3632, "lr": 1.0023584905660378e-07, "epoch": 0.020636792452830188, "percentage": 0.1, "elapsed_time": "0:00:04", "remaining_time": "1:14:14", "throughput": 4827.15, "total_tokens": 22208} {"current_steps": 40, "total_steps": 33920, "loss": 6.7811, "lr": 1.1497641509433962e-07, "epoch": 0.02358490566037736, "percentage": 0.12, "elapsed_time": "0:00:05", "remaining_time": "1:11:25", "throughput": 4857.12, "total_tokens": 24576} {"current_steps": 45, "total_steps": 33920, "loss": 6.83, "lr": 1.297169811320755e-07, "epoch": 0.02653301886792453, "percentage": 0.13, "elapsed_time": "0:00:05", "remaining_time": "1:11:33", "throughput": 5049.94, "total_tokens": 28800} {"current_steps": 50, "total_steps": 33920, "loss": 6.4312, "lr": 1.4445754716981135e-07, "epoch": 0.0294811320754717, "percentage": 0.15, "elapsed_time": "0:00:06", "remaining_time": "1:10:11", "throughput": 5111.58, "total_tokens": 31776} {"current_steps": 55, "total_steps": 33920, "loss": 6.1927, "lr": 1.591981132075472e-07, "epoch": 0.03242924528301887, "percentage": 0.16, "elapsed_time": "0:00:06", "remaining_time": "1:09:45", "throughput": 5244.37, "total_tokens": 35648} {"current_steps": 60, "total_steps": 33920, "loss": 6.5442, "lr": 1.7393867924528304e-07, "epoch": 0.03537735849056604, "percentage": 0.18, "elapsed_time": "0:00:07", "remaining_time": "1:08:31", "throughput": 5301.36, "total_tokens": 38624} {"current_steps": 65, "total_steps": 33920, "loss": 6.2018, "lr": 1.886792452830189e-07, "epoch": 0.038325471698113206, "percentage": 0.19, "elapsed_time": "0:00:07", "remaining_time": "1:07:30", "throughput": 5365.05, "total_tokens": 41728} {"current_steps": 70, "total_steps": 33920, "loss": 6.0513, "lr": 2.0341981132075473e-07, "epoch": 0.041273584905660375, "percentage": 0.21, "elapsed_time": "0:00:08", "remaining_time": "1:06:47", "throughput": 5390.45, "total_tokens": 44672} {"current_steps": 75, "total_steps": 33920, "loss": 6.3024, "lr": 2.1816037735849058e-07, "epoch": 0.044221698113207544, "percentage": 0.22, "elapsed_time": "0:00:08", "remaining_time": "1:06:15", "throughput": 5467.14, "total_tokens": 48160} {"current_steps": 80, "total_steps": 33920, "loss": 6.0573, "lr": 2.3290094339622643e-07, "epoch": 0.04716981132075472, "percentage": 0.24, "elapsed_time": "0:00:09", "remaining_time": "1:06:14", "throughput": 5510.31, "total_tokens": 51776} {"current_steps": 85, "total_steps": 33920, "loss": 6.4386, "lr": 2.476415094339623e-07, "epoch": 0.05011792452830189, "percentage": 0.25, "elapsed_time": "0:00:09", "remaining_time": "1:05:32", "throughput": 5519.7, "total_tokens": 54528} {"current_steps": 90, "total_steps": 33920, "loss": 6.3051, "lr": 2.6238207547169815e-07, "epoch": 0.05306603773584906, "percentage": 0.27, "elapsed_time": "0:00:10", "remaining_time": "1:05:11", "throughput": 5531.64, "total_tokens": 57568} {"current_steps": 95, "total_steps": 33920, "loss": 5.7796, "lr": 2.7712264150943397e-07, "epoch": 0.05601415094339623, "percentage": 0.28, "elapsed_time": "0:00:10", "remaining_time": "1:04:24", "throughput": 5551.02, "total_tokens": 60256} {"current_steps": 100, "total_steps": 33920, "loss": 5.4755, "lr": 2.9186320754716984e-07, "epoch": 0.0589622641509434, "percentage": 0.29, "elapsed_time": "0:00:11", "remaining_time": "1:03:38", "throughput": 5551.79, "total_tokens": 62688} {"current_steps": 105, "total_steps": 33920, "loss": 5.6559, "lr": 3.0660377358490567e-07, "epoch": 0.061910377358490566, "percentage": 0.31, "elapsed_time": "0:00:11", "remaining_time": "1:03:05", "throughput": 5559.12, "total_tokens": 65344} {"current_steps": 110, "total_steps": 33920, "loss": 5.1255, "lr": 3.213443396226416e-07, "epoch": 0.06485849056603774, "percentage": 0.32, "elapsed_time": "0:00:12", "remaining_time": "1:02:45", "throughput": 5594.91, "total_tokens": 68544} {"current_steps": 115, "total_steps": 33920, "loss": 5.5851, "lr": 3.3608490566037736e-07, "epoch": 0.06780660377358491, "percentage": 0.34, "elapsed_time": "0:00:12", "remaining_time": "1:02:17", "throughput": 5610.05, "total_tokens": 71328} {"current_steps": 120, "total_steps": 33920, "loss": 5.1278, "lr": 3.508254716981133e-07, "epoch": 0.07075471698113207, "percentage": 0.35, "elapsed_time": "0:00:13", "remaining_time": "1:01:57", "throughput": 5625.42, "total_tokens": 74240} {"current_steps": 125, "total_steps": 33920, "loss": 5.1234, "lr": 3.6556603773584905e-07, "epoch": 0.07370283018867925, "percentage": 0.37, "elapsed_time": "0:00:13", "remaining_time": "1:01:40", "throughput": 5644.01, "total_tokens": 77248} {"current_steps": 130, "total_steps": 33920, "loss": 5.103, "lr": 3.80306603773585e-07, "epoch": 0.07665094339622641, "percentage": 0.38, "elapsed_time": "0:00:14", "remaining_time": "1:01:32", "throughput": 5680.76, "total_tokens": 80704} {"current_steps": 135, "total_steps": 33920, "loss": 4.762, "lr": 3.9504716981132075e-07, "epoch": 0.07959905660377359, "percentage": 0.4, "elapsed_time": "0:00:14", "remaining_time": "1:01:25", "throughput": 5693.79, "total_tokens": 83840} {"current_steps": 140, "total_steps": 33920, "loss": 5.2388, "lr": 4.097877358490567e-07, "epoch": 0.08254716981132075, "percentage": 0.41, "elapsed_time": "0:00:15", "remaining_time": "1:01:10", "throughput": 5690.75, "total_tokens": 86560} {"current_steps": 145, "total_steps": 33920, "loss": 5.1523, "lr": 4.2452830188679244e-07, "epoch": 0.08549528301886793, "percentage": 0.43, "elapsed_time": "0:00:15", "remaining_time": "1:00:52", "throughput": 5699.64, "total_tokens": 89376} {"current_steps": 150, "total_steps": 33920, "loss": 4.4728, "lr": 4.3926886792452837e-07, "epoch": 0.08844339622641509, "percentage": 0.44, "elapsed_time": "0:00:16", "remaining_time": "1:02:27", "throughput": 5761.11, "total_tokens": 95904} {"current_steps": 155, "total_steps": 33920, "loss": 4.9182, "lr": 4.5400943396226414e-07, "epoch": 0.09139150943396226, "percentage": 0.46, "elapsed_time": "0:00:17", "remaining_time": "1:02:31", "throughput": 5779.49, "total_tokens": 99520} {"current_steps": 160, "total_steps": 33920, "loss": 4.8899, "lr": 4.6875000000000006e-07, "epoch": 0.09433962264150944, "percentage": 0.47, "elapsed_time": "0:00:17", "remaining_time": "1:02:16", "throughput": 5796.35, "total_tokens": 102656} {"current_steps": 165, "total_steps": 33920, "loss": 4.7307, "lr": 4.834905660377359e-07, "epoch": 0.0972877358490566, "percentage": 0.49, "elapsed_time": "0:00:18", "remaining_time": "1:01:57", "throughput": 5795.9, "total_tokens": 105312} {"current_steps": 170, "total_steps": 33920, "loss": 4.9404, "lr": 4.982311320754717e-07, "epoch": 0.10023584905660378, "percentage": 0.5, "elapsed_time": "0:00:18", "remaining_time": "1:01:43", "throughput": 5798.48, "total_tokens": 108160} {"current_steps": 175, "total_steps": 33920, "loss": 4.2148, "lr": 5.129716981132076e-07, "epoch": 0.10318396226415094, "percentage": 0.52, "elapsed_time": "0:00:19", "remaining_time": "1:01:37", "throughput": 5823.96, "total_tokens": 111680} {"current_steps": 180, "total_steps": 33920, "loss": 4.8944, "lr": 5.277122641509435e-07, "epoch": 0.10613207547169812, "percentage": 0.53, "elapsed_time": "0:00:19", "remaining_time": "1:01:32", "throughput": 5834.05, "total_tokens": 114912} {"current_steps": 185, "total_steps": 33920, "loss": 4.2355, "lr": 5.424528301886793e-07, "epoch": 0.10908018867924528, "percentage": 0.55, "elapsed_time": "0:00:20", "remaining_time": "1:01:11", "throughput": 5829.14, "total_tokens": 117376} {"current_steps": 190, "total_steps": 33920, "loss": 4.059, "lr": 5.571933962264151e-07, "epoch": 0.11202830188679246, "percentage": 0.56, "elapsed_time": "0:00:20", "remaining_time": "1:01:01", "throughput": 5838.55, "total_tokens": 120416} {"current_steps": 195, "total_steps": 33920, "loss": 4.4158, "lr": 5.71933962264151e-07, "epoch": 0.11497641509433962, "percentage": 0.57, "elapsed_time": "0:00:21", "remaining_time": "1:00:54", "throughput": 5840.86, "total_tokens": 123424} {"current_steps": 200, "total_steps": 33920, "loss": 4.3497, "lr": 5.866745283018868e-07, "epoch": 0.1179245283018868, "percentage": 0.59, "elapsed_time": "0:00:21", "remaining_time": "1:00:56", "throughput": 5861.48, "total_tokens": 127136} {"current_steps": 205, "total_steps": 33920, "loss": 4.2567, "lr": 6.014150943396227e-07, "epoch": 0.12087264150943396, "percentage": 0.6, "elapsed_time": "0:00:22", "remaining_time": "1:01:18", "throughput": 5894.39, "total_tokens": 131840} {"current_steps": 210, "total_steps": 33920, "loss": 3.9834, "lr": 6.161556603773585e-07, "epoch": 0.12382075471698113, "percentage": 0.62, "elapsed_time": "0:00:22", "remaining_time": "1:01:17", "throughput": 5908.43, "total_tokens": 135360} {"current_steps": 215, "total_steps": 33920, "loss": 4.1029, "lr": 6.308962264150945e-07, "epoch": 0.1267688679245283, "percentage": 0.63, "elapsed_time": "0:00:23", "remaining_time": "1:01:23", "throughput": 5928.98, "total_tokens": 139328} {"current_steps": 220, "total_steps": 33920, "loss": 4.156, "lr": 6.456367924528302e-07, "epoch": 0.12971698113207547, "percentage": 0.65, "elapsed_time": "0:00:24", "remaining_time": "1:01:25", "throughput": 5942.94, "total_tokens": 142976} {"current_steps": 225, "total_steps": 33920, "loss": 3.4806, "lr": 6.603773584905661e-07, "epoch": 0.13266509433962265, "percentage": 0.66, "elapsed_time": "0:00:24", "remaining_time": "1:01:23", "throughput": 5957.22, "total_tokens": 146528} {"current_steps": 230, "total_steps": 33920, "loss": 3.7368, "lr": 6.75117924528302e-07, "epoch": 0.13561320754716982, "percentage": 0.68, "elapsed_time": "0:00:25", "remaining_time": "1:02:09", "throughput": 5976.74, "total_tokens": 152192} {"current_steps": 235, "total_steps": 33920, "loss": 4.0799, "lr": 6.898584905660379e-07, "epoch": 0.13856132075471697, "percentage": 0.69, "elapsed_time": "0:00:25", "remaining_time": "1:01:53", "throughput": 5968.39, "total_tokens": 154624} {"current_steps": 240, "total_steps": 33920, "loss": 4.2881, "lr": 7.045990566037736e-07, "epoch": 0.14150943396226415, "percentage": 0.71, "elapsed_time": "0:00:26", "remaining_time": "1:01:47", "throughput": 5976.82, "total_tokens": 157920} {"current_steps": 245, "total_steps": 33920, "loss": 3.5618, "lr": 7.193396226415095e-07, "epoch": 0.14445754716981132, "percentage": 0.72, "elapsed_time": "0:00:26", "remaining_time": "1:01:35", "throughput": 5975.55, "total_tokens": 160640} {"current_steps": 250, "total_steps": 33920, "loss": 3.6146, "lr": 7.340801886792454e-07, "epoch": 0.1474056603773585, "percentage": 0.74, "elapsed_time": "0:00:27", "remaining_time": "1:01:38", "throughput": 5988.44, "total_tokens": 164448} {"current_steps": 255, "total_steps": 33920, "loss": 3.4774, "lr": 7.488207547169812e-07, "epoch": 0.15035377358490565, "percentage": 0.75, "elapsed_time": "0:00:28", "remaining_time": "1:01:41", "throughput": 5999.0, "total_tokens": 168192} {"current_steps": 260, "total_steps": 33920, "loss": 3.5721, "lr": 7.63561320754717e-07, "epoch": 0.15330188679245282, "percentage": 0.77, "elapsed_time": "0:00:28", "remaining_time": "1:01:49", "throughput": 6009.79, "total_tokens": 172192} {"current_steps": 265, "total_steps": 33920, "loss": 3.4567, "lr": 7.783018867924529e-07, "epoch": 0.15625, "percentage": 0.78, "elapsed_time": "0:00:29", "remaining_time": "1:01:38", "throughput": 6010.01, "total_tokens": 175008} {"current_steps": 270, "total_steps": 33920, "loss": 3.2578, "lr": 7.930424528301888e-07, "epoch": 0.15919811320754718, "percentage": 0.8, "elapsed_time": "0:00:29", "remaining_time": "1:01:29", "throughput": 6008.45, "total_tokens": 177888} {"current_steps": 275, "total_steps": 33920, "loss": 3.0722, "lr": 8.077830188679246e-07, "epoch": 0.16214622641509435, "percentage": 0.81, "elapsed_time": "0:00:30", "remaining_time": "1:01:29", "throughput": 6017.72, "total_tokens": 181472} {"current_steps": 280, "total_steps": 33920, "loss": 3.1394, "lr": 8.225235849056605e-07, "epoch": 0.1650943396226415, "percentage": 0.83, "elapsed_time": "0:00:30", "remaining_time": "1:02:04", "throughput": 6041.94, "total_tokens": 187296} {"current_steps": 285, "total_steps": 33920, "loss": 3.2233, "lr": 8.372641509433963e-07, "epoch": 0.16804245283018868, "percentage": 0.84, "elapsed_time": "0:00:31", "remaining_time": "1:01:49", "throughput": 6031.68, "total_tokens": 189600} {"current_steps": 290, "total_steps": 33920, "loss": 3.3117, "lr": 8.520047169811321e-07, "epoch": 0.17099056603773585, "percentage": 0.85, "elapsed_time": "0:00:31", "remaining_time": "1:01:48", "throughput": 6012.29, "total_tokens": 192256} {"current_steps": 295, "total_steps": 33920, "loss": 3.458, "lr": 8.66745283018868e-07, "epoch": 0.17393867924528303, "percentage": 0.87, "elapsed_time": "0:00:32", "remaining_time": "1:01:38", "throughput": 6014.06, "total_tokens": 195168} {"current_steps": 300, "total_steps": 33920, "loss": 3.4695, "lr": 8.814858490566039e-07, "epoch": 0.17688679245283018, "percentage": 0.88, "elapsed_time": "0:00:32", "remaining_time": "1:01:32", "throughput": 6021.19, "total_tokens": 198368} {"current_steps": 305, "total_steps": 33920, "loss": 3.3337, "lr": 8.962264150943397e-07, "epoch": 0.17983490566037735, "percentage": 0.9, "elapsed_time": "0:00:33", "remaining_time": "1:01:22", "throughput": 6021.73, "total_tokens": 201184} {"current_steps": 310, "total_steps": 33920, "loss": 3.3536, "lr": 9.109669811320755e-07, "epoch": 0.18278301886792453, "percentage": 0.91, "elapsed_time": "0:00:33", "remaining_time": "1:01:16", "throughput": 6015.66, "total_tokens": 204000} {"current_steps": 315, "total_steps": 33920, "loss": 3.1915, "lr": 9.257075471698114e-07, "epoch": 0.1857311320754717, "percentage": 0.93, "elapsed_time": "0:00:34", "remaining_time": "1:01:12", "throughput": 6016.51, "total_tokens": 207136} {"current_steps": 320, "total_steps": 33920, "loss": 2.6377, "lr": 9.404481132075473e-07, "epoch": 0.18867924528301888, "percentage": 0.94, "elapsed_time": "0:00:34", "remaining_time": "1:01:07", "throughput": 6016.04, "total_tokens": 210112} {"current_steps": 325, "total_steps": 33920, "loss": 2.676, "lr": 9.551886792452833e-07, "epoch": 0.19162735849056603, "percentage": 0.96, "elapsed_time": "0:00:35", "remaining_time": "1:00:58", "throughput": 6011.13, "total_tokens": 212736} {"current_steps": 330, "total_steps": 33920, "loss": 2.634, "lr": 9.699292452830188e-07, "epoch": 0.1945754716981132, "percentage": 0.97, "elapsed_time": "0:00:35", "remaining_time": "1:00:51", "throughput": 6009.29, "total_tokens": 215584} {"current_steps": 335, "total_steps": 33920, "loss": 3.4525, "lr": 9.846698113207548e-07, "epoch": 0.19752358490566038, "percentage": 0.99, "elapsed_time": "0:00:36", "remaining_time": "1:00:51", "throughput": 6010.88, "total_tokens": 218912} {"current_steps": 340, "total_steps": 33920, "loss": 2.8842, "lr": 9.994103773584906e-07, "epoch": 0.20047169811320756, "percentage": 1.0, "elapsed_time": "0:00:36", "remaining_time": "1:00:51", "throughput": 6017.06, "total_tokens": 222432} {"current_steps": 345, "total_steps": 33920, "loss": 2.9732, "lr": 1.0141509433962265e-06, "epoch": 0.2034198113207547, "percentage": 1.02, "elapsed_time": "0:00:37", "remaining_time": "1:00:53", "throughput": 6026.9, "total_tokens": 226240} {"current_steps": 350, "total_steps": 33920, "loss": 3.066, "lr": 1.0288915094339623e-06, "epoch": 0.20636792452830188, "percentage": 1.03, "elapsed_time": "0:00:38", "remaining_time": "1:00:53", "throughput": 6034.71, "total_tokens": 229888} {"current_steps": 355, "total_steps": 33920, "loss": 2.8984, "lr": 1.043632075471698e-06, "epoch": 0.20931603773584906, "percentage": 1.05, "elapsed_time": "0:00:38", "remaining_time": "1:01:02", "throughput": 6046.09, "total_tokens": 234176} {"current_steps": 360, "total_steps": 33920, "loss": 3.0836, "lr": 1.058372641509434e-06, "epoch": 0.21226415094339623, "percentage": 1.06, "elapsed_time": "0:00:39", "remaining_time": "1:00:59", "throughput": 6055.07, "total_tokens": 237696} {"current_steps": 365, "total_steps": 33920, "loss": 2.8502, "lr": 1.07311320754717e-06, "epoch": 0.21521226415094338, "percentage": 1.08, "elapsed_time": "0:00:39", "remaining_time": "1:01:01", "throughput": 6064.75, "total_tokens": 241568} {"current_steps": 370, "total_steps": 33920, "loss": 2.7408, "lr": 1.0878537735849056e-06, "epoch": 0.21816037735849056, "percentage": 1.09, "elapsed_time": "0:00:40", "remaining_time": "1:00:52", "throughput": 6056.94, "total_tokens": 243968} {"current_steps": 375, "total_steps": 33920, "loss": 2.5705, "lr": 1.1025943396226416e-06, "epoch": 0.22110849056603774, "percentage": 1.11, "elapsed_time": "0:00:40", "remaining_time": "1:00:44", "throughput": 6054.83, "total_tokens": 246656} {"current_steps": 380, "total_steps": 33920, "loss": 2.7849, "lr": 1.1173349056603773e-06, "epoch": 0.2240566037735849, "percentage": 1.12, "elapsed_time": "0:00:41", "remaining_time": "1:00:47", "throughput": 6063.13, "total_tokens": 250528} {"current_steps": 385, "total_steps": 33920, "loss": 2.6605, "lr": 1.1320754716981133e-06, "epoch": 0.2270047169811321, "percentage": 1.14, "elapsed_time": "0:00:41", "remaining_time": "1:00:40", "throughput": 6059.36, "total_tokens": 253280} {"current_steps": 390, "total_steps": 33920, "loss": 2.659, "lr": 1.1468160377358493e-06, "epoch": 0.22995283018867924, "percentage": 1.15, "elapsed_time": "0:00:42", "remaining_time": "1:00:35", "throughput": 6063.83, "total_tokens": 256448} {"current_steps": 395, "total_steps": 33920, "loss": 2.8954, "lr": 1.1615566037735849e-06, "epoch": 0.2329009433962264, "percentage": 1.16, "elapsed_time": "0:00:42", "remaining_time": "1:00:30", "throughput": 6064.61, "total_tokens": 259392} {"current_steps": 400, "total_steps": 33920, "loss": 2.6005, "lr": 1.1762971698113208e-06, "epoch": 0.2358490566037736, "percentage": 1.18, "elapsed_time": "0:00:43", "remaining_time": "1:00:27", "throughput": 6063.16, "total_tokens": 262432} {"current_steps": 405, "total_steps": 33920, "loss": 2.4863, "lr": 1.1910377358490568e-06, "epoch": 0.23879716981132076, "percentage": 1.19, "elapsed_time": "0:00:43", "remaining_time": "1:00:18", "throughput": 6062.14, "total_tokens": 265088} {"current_steps": 410, "total_steps": 33920, "loss": 2.882, "lr": 1.2057783018867926e-06, "epoch": 0.2417452830188679, "percentage": 1.21, "elapsed_time": "0:00:44", "remaining_time": "1:00:17", "throughput": 6066.5, "total_tokens": 268480} {"current_steps": 415, "total_steps": 33920, "loss": 2.4369, "lr": 1.2205188679245284e-06, "epoch": 0.2446933962264151, "percentage": 1.22, "elapsed_time": "0:00:44", "remaining_time": "1:00:21", "throughput": 6074.2, "total_tokens": 272448} {"current_steps": 420, "total_steps": 33920, "loss": 2.3918, "lr": 1.2352594339622641e-06, "epoch": 0.24764150943396226, "percentage": 1.24, "elapsed_time": "0:00:45", "remaining_time": "1:00:15", "throughput": 6069.99, "total_tokens": 275168} {"current_steps": 425, "total_steps": 33920, "loss": 2.3237, "lr": 1.25e-06, "epoch": 0.2505896226415094, "percentage": 1.25, "elapsed_time": "0:00:45", "remaining_time": "1:00:09", "throughput": 6067.75, "total_tokens": 277888} {"current_steps": 430, "total_steps": 33920, "loss": 2.6138, "lr": 1.264740566037736e-06, "epoch": 0.2535377358490566, "percentage": 1.27, "elapsed_time": "0:00:46", "remaining_time": "1:00:08", "throughput": 6071.46, "total_tokens": 281280} {"current_steps": 435, "total_steps": 33920, "loss": 2.642, "lr": 1.2794811320754718e-06, "epoch": 0.25648584905660377, "percentage": 1.28, "elapsed_time": "0:00:46", "remaining_time": "1:00:01", "throughput": 6067.48, "total_tokens": 283904} {"current_steps": 440, "total_steps": 33920, "loss": 2.586, "lr": 1.2942216981132078e-06, "epoch": 0.25943396226415094, "percentage": 1.3, "elapsed_time": "0:00:47", "remaining_time": "0:59:54", "throughput": 6065.18, "total_tokens": 286528} {"current_steps": 445, "total_steps": 33920, "loss": 2.555, "lr": 1.3089622641509436e-06, "epoch": 0.2623820754716981, "percentage": 1.31, "elapsed_time": "0:00:47", "remaining_time": "0:59:56", "throughput": 6067.32, "total_tokens": 290048} {"current_steps": 450, "total_steps": 33920, "loss": 2.4563, "lr": 1.3237028301886792e-06, "epoch": 0.2653301886792453, "percentage": 1.33, "elapsed_time": "0:00:48", "remaining_time": "1:00:00", "throughput": 6075.05, "total_tokens": 294080} {"current_steps": 455, "total_steps": 33920, "loss": 2.7682, "lr": 1.3384433962264151e-06, "epoch": 0.26827830188679247, "percentage": 1.34, "elapsed_time": "0:00:48", "remaining_time": "0:59:53", "throughput": 6070.33, "total_tokens": 296608} {"current_steps": 460, "total_steps": 33920, "loss": 2.4682, "lr": 1.353183962264151e-06, "epoch": 0.27122641509433965, "percentage": 1.36, "elapsed_time": "0:00:49", "remaining_time": "0:59:47", "throughput": 6065.2, "total_tokens": 299136} {"current_steps": 465, "total_steps": 33920, "loss": 2.3755, "lr": 1.3679245283018869e-06, "epoch": 0.27417452830188677, "percentage": 1.37, "elapsed_time": "0:00:49", "remaining_time": "0:59:45", "throughput": 6063.98, "total_tokens": 302240} {"current_steps": 470, "total_steps": 33920, "loss": 2.2079, "lr": 1.3826650943396229e-06, "epoch": 0.27712264150943394, "percentage": 1.39, "elapsed_time": "0:00:50", "remaining_time": "0:59:46", "throughput": 6069.53, "total_tokens": 305888} {"current_steps": 475, "total_steps": 33920, "loss": 2.7853, "lr": 1.3974056603773586e-06, "epoch": 0.2800707547169811, "percentage": 1.4, "elapsed_time": "0:00:50", "remaining_time": "0:59:44", "throughput": 6068.88, "total_tokens": 308992} {"current_steps": 480, "total_steps": 33920, "loss": 2.7675, "lr": 1.4121462264150946e-06, "epoch": 0.2830188679245283, "percentage": 1.42, "elapsed_time": "0:00:51", "remaining_time": "0:59:37", "throughput": 6063.91, "total_tokens": 311360} {"current_steps": 485, "total_steps": 33920, "loss": 2.2163, "lr": 1.4268867924528304e-06, "epoch": 0.28596698113207547, "percentage": 1.43, "elapsed_time": "0:00:51", "remaining_time": "0:59:30", "throughput": 6059.99, "total_tokens": 313824} {"current_steps": 490, "total_steps": 33920, "loss": 2.5636, "lr": 1.4416273584905664e-06, "epoch": 0.28891509433962265, "percentage": 1.44, "elapsed_time": "0:00:52", "remaining_time": "0:59:25", "throughput": 6059.46, "total_tokens": 316640} {"current_steps": 495, "total_steps": 33920, "loss": 2.1607, "lr": 1.456367924528302e-06, "epoch": 0.2918632075471698, "percentage": 1.46, "elapsed_time": "0:00:52", "remaining_time": "0:59:28", "throughput": 6065.31, "total_tokens": 320576} {"current_steps": 500, "total_steps": 33920, "loss": 2.4592, "lr": 1.4711084905660377e-06, "epoch": 0.294811320754717, "percentage": 1.47, "elapsed_time": "0:00:53", "remaining_time": "0:59:29", "throughput": 6071.95, "total_tokens": 324288} {"current_steps": 505, "total_steps": 33920, "loss": 2.2579, "lr": 1.4858490566037737e-06, "epoch": 0.2977594339622642, "percentage": 1.49, "elapsed_time": "0:00:53", "remaining_time": "0:59:24", "throughput": 6071.75, "total_tokens": 327072} {"current_steps": 510, "total_steps": 33920, "loss": 2.2751, "lr": 1.5005896226415096e-06, "epoch": 0.3007075471698113, "percentage": 1.5, "elapsed_time": "0:00:54", "remaining_time": "0:59:18", "throughput": 6064.18, "total_tokens": 329408} {"current_steps": 515, "total_steps": 33920, "loss": 2.1318, "lr": 1.5153301886792454e-06, "epoch": 0.30365566037735847, "percentage": 1.52, "elapsed_time": "0:00:54", "remaining_time": "0:59:16", "throughput": 6067.98, "total_tokens": 332704} {"current_steps": 520, "total_steps": 33920, "loss": 2.4837, "lr": 1.5300707547169814e-06, "epoch": 0.30660377358490565, "percentage": 1.53, "elapsed_time": "0:00:55", "remaining_time": "0:59:11", "throughput": 6068.41, "total_tokens": 335552} {"current_steps": 525, "total_steps": 33920, "loss": 2.3355, "lr": 1.5448113207547172e-06, "epoch": 0.3095518867924528, "percentage": 1.55, "elapsed_time": "0:00:55", "remaining_time": "0:59:07", "throughput": 6070.46, "total_tokens": 338560} {"current_steps": 530, "total_steps": 33920, "loss": 2.1778, "lr": 1.5595518867924531e-06, "epoch": 0.3125, "percentage": 1.56, "elapsed_time": "0:00:56", "remaining_time": "0:59:12", "throughput": 6075.3, "total_tokens": 342592} {"current_steps": 535, "total_steps": 33920, "loss": 1.9473, "lr": 1.574292452830189e-06, "epoch": 0.3154481132075472, "percentage": 1.58, "elapsed_time": "0:00:56", "remaining_time": "0:59:13", "throughput": 6079.71, "total_tokens": 346176} {"current_steps": 540, "total_steps": 33920, "loss": 1.8161, "lr": 1.5890330188679245e-06, "epoch": 0.31839622641509435, "percentage": 1.59, "elapsed_time": "0:00:57", "remaining_time": "0:59:18", "throughput": 6087.39, "total_tokens": 350464} {"current_steps": 545, "total_steps": 33920, "loss": 2.2977, "lr": 1.6037735849056604e-06, "epoch": 0.32134433962264153, "percentage": 1.61, "elapsed_time": "0:00:58", "remaining_time": "0:59:21", "throughput": 6085.21, "total_tokens": 353856} {"current_steps": 550, "total_steps": 33920, "loss": 1.9008, "lr": 1.6185141509433964e-06, "epoch": 0.3242924528301887, "percentage": 1.62, "elapsed_time": "0:00:58", "remaining_time": "0:59:17", "throughput": 6081.74, "total_tokens": 356608} {"current_steps": 555, "total_steps": 33920, "loss": 2.6972, "lr": 1.6332547169811322e-06, "epoch": 0.3272405660377358, "percentage": 1.64, "elapsed_time": "0:00:59", "remaining_time": "0:59:13", "throughput": 6083.04, "total_tokens": 359520} {"current_steps": 560, "total_steps": 33920, "loss": 2.1941, "lr": 1.6479952830188682e-06, "epoch": 0.330188679245283, "percentage": 1.65, "elapsed_time": "0:00:59", "remaining_time": "0:59:16", "throughput": 6089.86, "total_tokens": 363616} {"current_steps": 565, "total_steps": 33920, "loss": 2.5141, "lr": 1.662735849056604e-06, "epoch": 0.3331367924528302, "percentage": 1.67, "elapsed_time": "0:01:00", "remaining_time": "0:59:12", "throughput": 6088.09, "total_tokens": 366336} {"current_steps": 570, "total_steps": 33920, "loss": 2.0076, "lr": 1.67747641509434e-06, "epoch": 0.33608490566037735, "percentage": 1.68, "elapsed_time": "0:01:00", "remaining_time": "0:59:10", "throughput": 6090.55, "total_tokens": 369632} {"current_steps": 575, "total_steps": 33920, "loss": 1.975, "lr": 1.6922169811320757e-06, "epoch": 0.33903301886792453, "percentage": 1.7, "elapsed_time": "0:01:01", "remaining_time": "0:59:11", "throughput": 6094.81, "total_tokens": 373280} {"current_steps": 580, "total_steps": 33920, "loss": 2.4221, "lr": 1.7069575471698112e-06, "epoch": 0.3419811320754717, "percentage": 1.71, "elapsed_time": "0:01:01", "remaining_time": "0:59:22", "throughput": 6102.69, "total_tokens": 378176} {"current_steps": 585, "total_steps": 33920, "loss": 1.9371, "lr": 1.7216981132075472e-06, "epoch": 0.3449292452830189, "percentage": 1.72, "elapsed_time": "0:01:02", "remaining_time": "0:59:16", "throughput": 6103.57, "total_tokens": 380992} {"current_steps": 590, "total_steps": 33920, "loss": 2.1914, "lr": 1.736438679245283e-06, "epoch": 0.34787735849056606, "percentage": 1.74, "elapsed_time": "0:01:02", "remaining_time": "0:59:13", "throughput": 6102.68, "total_tokens": 383840} {"current_steps": 595, "total_steps": 33920, "loss": 1.7578, "lr": 1.751179245283019e-06, "epoch": 0.35082547169811323, "percentage": 1.75, "elapsed_time": "0:01:03", "remaining_time": "0:59:08", "throughput": 6103.92, "total_tokens": 386720} {"current_steps": 600, "total_steps": 33920, "loss": 2.049, "lr": 1.765919811320755e-06, "epoch": 0.35377358490566035, "percentage": 1.77, "elapsed_time": "0:01:03", "remaining_time": "0:59:04", "throughput": 6105.06, "total_tokens": 389664} {"current_steps": 605, "total_steps": 33920, "loss": 2.5405, "lr": 1.7806603773584907e-06, "epoch": 0.35672169811320753, "percentage": 1.78, "elapsed_time": "0:01:04", "remaining_time": "0:59:04", "throughput": 6106.35, "total_tokens": 393024} {"current_steps": 610, "total_steps": 33920, "loss": 1.9969, "lr": 1.7954009433962267e-06, "epoch": 0.3596698113207547, "percentage": 1.8, "elapsed_time": "0:01:04", "remaining_time": "0:59:04", "throughput": 6109.35, "total_tokens": 396576} {"current_steps": 615, "total_steps": 33920, "loss": 2.3094, "lr": 1.8101415094339625e-06, "epoch": 0.3626179245283019, "percentage": 1.81, "elapsed_time": "0:01:05", "remaining_time": "0:59:00", "throughput": 6110.78, "total_tokens": 399488} {"current_steps": 620, "total_steps": 33920, "loss": 1.9377, "lr": 1.8248820754716984e-06, "epoch": 0.36556603773584906, "percentage": 1.83, "elapsed_time": "0:01:05", "remaining_time": "0:58:56", "throughput": 6112.15, "total_tokens": 402496} {"current_steps": 625, "total_steps": 33920, "loss": 1.7228, "lr": 1.839622641509434e-06, "epoch": 0.36851415094339623, "percentage": 1.84, "elapsed_time": "0:01:06", "remaining_time": "0:58:55", "throughput": 6111.1, "total_tokens": 405568} {"current_steps": 630, "total_steps": 33920, "loss": 1.8129, "lr": 1.8543632075471698e-06, "epoch": 0.3714622641509434, "percentage": 1.86, "elapsed_time": "0:01:06", "remaining_time": "0:58:52", "throughput": 6108.63, "total_tokens": 408416} {"current_steps": 635, "total_steps": 33920, "loss": 1.7833, "lr": 1.8691037735849057e-06, "epoch": 0.3744103773584906, "percentage": 1.87, "elapsed_time": "0:01:07", "remaining_time": "0:58:50", "throughput": 6107.97, "total_tokens": 411360} {"current_steps": 640, "total_steps": 33920, "loss": 1.6358, "lr": 1.8838443396226417e-06, "epoch": 0.37735849056603776, "percentage": 1.89, "elapsed_time": "0:01:07", "remaining_time": "0:58:47", "throughput": 6104.98, "total_tokens": 414112} {"current_steps": 645, "total_steps": 33920, "loss": 1.7158, "lr": 1.8985849056603775e-06, "epoch": 0.3803066037735849, "percentage": 1.9, "elapsed_time": "0:01:08", "remaining_time": "0:58:46", "throughput": 6107.0, "total_tokens": 417408} {"current_steps": 650, "total_steps": 33920, "loss": 1.8702, "lr": 1.9133254716981133e-06, "epoch": 0.38325471698113206, "percentage": 1.92, "elapsed_time": "0:01:08", "remaining_time": "0:58:44", "throughput": 6108.57, "total_tokens": 420640} {"current_steps": 655, "total_steps": 33920, "loss": 1.9492, "lr": 1.9280660377358494e-06, "epoch": 0.38620283018867924, "percentage": 1.93, "elapsed_time": "0:01:09", "remaining_time": "0:58:38", "throughput": 6100.81, "total_tokens": 422688} {"current_steps": 660, "total_steps": 33920, "loss": 2.083, "lr": 1.9428066037735852e-06, "epoch": 0.3891509433962264, "percentage": 1.95, "elapsed_time": "0:01:09", "remaining_time": "0:58:44", "throughput": 6107.86, "total_tokens": 427136} {"current_steps": 665, "total_steps": 33920, "loss": 1.7583, "lr": 1.957547169811321e-06, "epoch": 0.3920990566037736, "percentage": 1.96, "elapsed_time": "0:01:10", "remaining_time": "0:58:42", "throughput": 6110.23, "total_tokens": 430400} {"current_steps": 670, "total_steps": 33920, "loss": 1.7232, "lr": 1.9722877358490568e-06, "epoch": 0.39504716981132076, "percentage": 1.98, "elapsed_time": "0:01:10", "remaining_time": "0:58:40", "throughput": 6112.88, "total_tokens": 433632} {"current_steps": 675, "total_steps": 33920, "loss": 1.8499, "lr": 1.9870283018867925e-06, "epoch": 0.39799528301886794, "percentage": 1.99, "elapsed_time": "0:01:11", "remaining_time": "0:58:39", "throughput": 6115.02, "total_tokens": 436960} {"current_steps": 680, "total_steps": 33920, "loss": 1.5063, "lr": 2.0017688679245283e-06, "epoch": 0.4009433962264151, "percentage": 2.0, "elapsed_time": "0:01:11", "remaining_time": "0:58:38", "throughput": 6112.81, "total_tokens": 439968} {"current_steps": 685, "total_steps": 33920, "loss": 1.5491, "lr": 2.0165094339622645e-06, "epoch": 0.40389150943396224, "percentage": 2.02, "elapsed_time": "0:01:12", "remaining_time": "0:58:36", "throughput": 6114.1, "total_tokens": 443168} {"current_steps": 690, "total_steps": 33920, "loss": 1.5964, "lr": 2.0312500000000002e-06, "epoch": 0.4068396226415094, "percentage": 2.03, "elapsed_time": "0:01:12", "remaining_time": "0:58:33", "throughput": 6113.35, "total_tokens": 445984} {"current_steps": 695, "total_steps": 33920, "loss": 1.7867, "lr": 2.045990566037736e-06, "epoch": 0.4097877358490566, "percentage": 2.05, "elapsed_time": "0:01:13", "remaining_time": "0:58:31", "throughput": 6115.95, "total_tokens": 449280} {"current_steps": 700, "total_steps": 33920, "loss": 1.5458, "lr": 2.0607311320754718e-06, "epoch": 0.41273584905660377, "percentage": 2.06, "elapsed_time": "0:01:13", "remaining_time": "0:58:31", "throughput": 6119.52, "total_tokens": 452832} {"current_steps": 705, "total_steps": 33920, "loss": 1.3588, "lr": 2.075471698113208e-06, "epoch": 0.41568396226415094, "percentage": 2.08, "elapsed_time": "0:01:14", "remaining_time": "0:58:27", "throughput": 6116.35, "total_tokens": 455360} {"current_steps": 710, "total_steps": 33920, "loss": 1.3306, "lr": 2.0902122641509437e-06, "epoch": 0.4186320754716981, "percentage": 2.09, "elapsed_time": "0:01:15", "remaining_time": "0:58:28", "throughput": 6118.29, "total_tokens": 458944} {"current_steps": 715, "total_steps": 33920, "loss": 1.4604, "lr": 2.1049528301886795e-06, "epoch": 0.4215801886792453, "percentage": 2.11, "elapsed_time": "0:01:15", "remaining_time": "0:58:28", "throughput": 6116.47, "total_tokens": 462080} {"current_steps": 720, "total_steps": 33920, "loss": 1.3827, "lr": 2.1196933962264153e-06, "epoch": 0.42452830188679247, "percentage": 2.12, "elapsed_time": "0:01:16", "remaining_time": "0:58:31", "throughput": 6118.12, "total_tokens": 465888} {"current_steps": 725, "total_steps": 33920, "loss": 1.6747, "lr": 2.134433962264151e-06, "epoch": 0.42747641509433965, "percentage": 2.14, "elapsed_time": "0:01:16", "remaining_time": "0:58:29", "throughput": 6117.64, "total_tokens": 468928} {"current_steps": 730, "total_steps": 33920, "loss": 0.9826, "lr": 2.149174528301887e-06, "epoch": 0.43042452830188677, "percentage": 2.15, "elapsed_time": "0:01:17", "remaining_time": "0:58:28", "throughput": 6117.81, "total_tokens": 472032} {"current_steps": 735, "total_steps": 33920, "loss": 1.2454, "lr": 2.163915094339623e-06, "epoch": 0.43337264150943394, "percentage": 2.17, "elapsed_time": "0:01:17", "remaining_time": "0:58:24", "throughput": 6116.79, "total_tokens": 474816} {"current_steps": 740, "total_steps": 33920, "loss": 1.61, "lr": 2.1786556603773588e-06, "epoch": 0.4363207547169811, "percentage": 2.18, "elapsed_time": "0:01:18", "remaining_time": "0:58:20", "throughput": 6114.78, "total_tokens": 477344} {"current_steps": 745, "total_steps": 33920, "loss": 1.2651, "lr": 2.1933962264150945e-06, "epoch": 0.4392688679245283, "percentage": 2.2, "elapsed_time": "0:01:18", "remaining_time": "0:58:17", "throughput": 6112.99, "total_tokens": 480096} {"current_steps": 750, "total_steps": 33920, "loss": 0.9204, "lr": 2.2081367924528303e-06, "epoch": 0.44221698113207547, "percentage": 2.21, "elapsed_time": "0:01:19", "remaining_time": "0:58:18", "throughput": 6114.74, "total_tokens": 483712} {"current_steps": 755, "total_steps": 33920, "loss": 0.9592, "lr": 2.2228773584905665e-06, "epoch": 0.44516509433962265, "percentage": 2.23, "elapsed_time": "0:01:19", "remaining_time": "0:58:17", "throughput": 6117.51, "total_tokens": 487072} {"current_steps": 760, "total_steps": 33920, "loss": 1.185, "lr": 2.237617924528302e-06, "epoch": 0.4481132075471698, "percentage": 2.24, "elapsed_time": "0:01:20", "remaining_time": "0:58:16", "throughput": 6119.18, "total_tokens": 490432} {"current_steps": 765, "total_steps": 33920, "loss": 0.8052, "lr": 2.252358490566038e-06, "epoch": 0.451061320754717, "percentage": 2.26, "elapsed_time": "0:01:20", "remaining_time": "0:58:15", "throughput": 6118.88, "total_tokens": 493440} {"current_steps": 770, "total_steps": 33920, "loss": 0.947, "lr": 2.267099056603774e-06, "epoch": 0.4540094339622642, "percentage": 2.27, "elapsed_time": "0:01:21", "remaining_time": "0:58:12", "throughput": 6114.45, "total_tokens": 496000} {"current_steps": 775, "total_steps": 33920, "loss": 0.9103, "lr": 2.2818396226415096e-06, "epoch": 0.4569575471698113, "percentage": 2.28, "elapsed_time": "0:01:21", "remaining_time": "0:58:14", "throughput": 6118.21, "total_tokens": 499904} {"current_steps": 780, "total_steps": 33920, "loss": 0.9831, "lr": 2.2965801886792453e-06, "epoch": 0.45990566037735847, "percentage": 2.3, "elapsed_time": "0:01:22", "remaining_time": "0:58:18", "throughput": 6124.12, "total_tokens": 504256} {"current_steps": 785, "total_steps": 33920, "loss": 0.7673, "lr": 2.3113207547169815e-06, "epoch": 0.46285377358490565, "percentage": 2.31, "elapsed_time": "0:01:22", "remaining_time": "0:58:18", "throughput": 6124.94, "total_tokens": 507616} {"current_steps": 790, "total_steps": 33920, "loss": 1.0915, "lr": 2.3260613207547173e-06, "epoch": 0.4658018867924528, "percentage": 2.33, "elapsed_time": "0:01:23", "remaining_time": "0:58:16", "throughput": 6126.17, "total_tokens": 510720} {"current_steps": 795, "total_steps": 33920, "loss": 0.8194, "lr": 2.340801886792453e-06, "epoch": 0.46875, "percentage": 2.34, "elapsed_time": "0:01:23", "remaining_time": "0:58:14", "throughput": 6128.3, "total_tokens": 514016} {"current_steps": 800, "total_steps": 33920, "loss": 0.8714, "lr": 2.355542452830189e-06, "epoch": 0.4716981132075472, "percentage": 2.36, "elapsed_time": "0:01:24", "remaining_time": "0:58:12", "throughput": 6129.2, "total_tokens": 517024} {"current_steps": 805, "total_steps": 33920, "loss": 1.102, "lr": 2.3702830188679246e-06, "epoch": 0.47464622641509435, "percentage": 2.37, "elapsed_time": "0:01:24", "remaining_time": "0:58:10", "throughput": 6127.87, "total_tokens": 520032} {"current_steps": 810, "total_steps": 33920, "loss": 0.9178, "lr": 2.3850235849056604e-06, "epoch": 0.47759433962264153, "percentage": 2.39, "elapsed_time": "0:01:25", "remaining_time": "0:58:09", "throughput": 6129.95, "total_tokens": 523232} {"current_steps": 815, "total_steps": 33920, "loss": 0.8341, "lr": 2.3997641509433966e-06, "epoch": 0.4805424528301887, "percentage": 2.4, "elapsed_time": "0:01:25", "remaining_time": "0:58:06", "throughput": 6129.42, "total_tokens": 526080} {"current_steps": 820, "total_steps": 33920, "loss": 0.8807, "lr": 2.4145047169811323e-06, "epoch": 0.4834905660377358, "percentage": 2.42, "elapsed_time": "0:01:26", "remaining_time": "0:58:01", "throughput": 6125.67, "total_tokens": 528384} {"current_steps": 825, "total_steps": 33920, "loss": 0.699, "lr": 2.429245283018868e-06, "epoch": 0.486438679245283, "percentage": 2.43, "elapsed_time": "0:01:26", "remaining_time": "0:58:01", "throughput": 6128.36, "total_tokens": 531808} {"current_steps": 830, "total_steps": 33920, "loss": 0.9971, "lr": 2.443985849056604e-06, "epoch": 0.4893867924528302, "percentage": 2.45, "elapsed_time": "0:01:27", "remaining_time": "0:58:01", "throughput": 6130.82, "total_tokens": 535392} {"current_steps": 835, "total_steps": 33920, "loss": 0.9152, "lr": 2.45872641509434e-06, "epoch": 0.49233490566037735, "percentage": 2.46, "elapsed_time": "0:01:27", "remaining_time": "0:58:00", "throughput": 6132.98, "total_tokens": 538752} {"current_steps": 840, "total_steps": 33920, "loss": 0.8088, "lr": 2.473466981132076e-06, "epoch": 0.49528301886792453, "percentage": 2.48, "elapsed_time": "0:01:28", "remaining_time": "0:58:00", "throughput": 6131.93, "total_tokens": 541920} {"current_steps": 845, "total_steps": 33920, "loss": 0.856, "lr": 2.4882075471698116e-06, "epoch": 0.4982311320754717, "percentage": 2.49, "elapsed_time": "0:01:28", "remaining_time": "0:57:58", "throughput": 6133.13, "total_tokens": 545024} {"current_steps": 850, "total_steps": 33920, "loss": 0.8352, "lr": 2.5029481132075474e-06, "epoch": 0.5011792452830188, "percentage": 2.51, "elapsed_time": "0:01:29", "remaining_time": "0:57:57", "throughput": 6134.8, "total_tokens": 548384} {"current_steps": 855, "total_steps": 33920, "loss": 0.8574, "lr": 2.517688679245283e-06, "epoch": 0.504127358490566, "percentage": 2.52, "elapsed_time": "0:01:29", "remaining_time": "0:57:57", "throughput": 6135.01, "total_tokens": 551712} {"current_steps": 860, "total_steps": 33920, "loss": 0.7831, "lr": 2.532429245283019e-06, "epoch": 0.5070754716981132, "percentage": 2.54, "elapsed_time": "0:01:30", "remaining_time": "0:57:55", "throughput": 6134.66, "total_tokens": 554688} {"current_steps": 865, "total_steps": 33920, "loss": 1.0198, "lr": 2.547169811320755e-06, "epoch": 0.5100235849056604, "percentage": 2.55, "elapsed_time": "0:01:30", "remaining_time": "0:57:55", "throughput": 6133.95, "total_tokens": 557888} {"current_steps": 870, "total_steps": 33920, "loss": 0.7339, "lr": 2.561910377358491e-06, "epoch": 0.5129716981132075, "percentage": 2.56, "elapsed_time": "0:01:31", "remaining_time": "0:57:57", "throughput": 6138.2, "total_tokens": 561856} {"current_steps": 875, "total_steps": 33920, "loss": 0.711, "lr": 2.5766509433962266e-06, "epoch": 0.5159198113207547, "percentage": 2.58, "elapsed_time": "0:01:32", "remaining_time": "0:57:56", "throughput": 6137.26, "total_tokens": 565024} {"current_steps": 880, "total_steps": 33920, "loss": 0.9388, "lr": 2.5913915094339624e-06, "epoch": 0.5188679245283019, "percentage": 2.59, "elapsed_time": "0:01:32", "remaining_time": "0:57:56", "throughput": 6138.81, "total_tokens": 568480} {"current_steps": 885, "total_steps": 33920, "loss": 1.1166, "lr": 2.6061320754716986e-06, "epoch": 0.5218160377358491, "percentage": 2.61, "elapsed_time": "0:01:33", "remaining_time": "0:57:57", "throughput": 6140.74, "total_tokens": 572096} {"current_steps": 890, "total_steps": 33920, "loss": 0.9136, "lr": 2.6208726415094343e-06, "epoch": 0.5247641509433962, "percentage": 2.62, "elapsed_time": "0:01:33", "remaining_time": "0:57:57", "throughput": 6142.01, "total_tokens": 575520} {"current_steps": 895, "total_steps": 33920, "loss": 0.748, "lr": 2.63561320754717e-06, "epoch": 0.5277122641509434, "percentage": 2.64, "elapsed_time": "0:01:34", "remaining_time": "0:57:56", "throughput": 6143.83, "total_tokens": 578848} {"current_steps": 900, "total_steps": 33920, "loss": 0.6337, "lr": 2.650353773584906e-06, "epoch": 0.5306603773584906, "percentage": 2.65, "elapsed_time": "0:01:34", "remaining_time": "0:57:59", "throughput": 6147.41, "total_tokens": 583008} {"current_steps": 905, "total_steps": 33920, "loss": 0.7095, "lr": 2.665094339622642e-06, "epoch": 0.5336084905660378, "percentage": 2.67, "elapsed_time": "0:01:35", "remaining_time": "0:57:59", "throughput": 6148.63, "total_tokens": 586432} {"current_steps": 910, "total_steps": 33920, "loss": 0.877, "lr": 2.679834905660378e-06, "epoch": 0.5365566037735849, "percentage": 2.68, "elapsed_time": "0:01:35", "remaining_time": "0:57:57", "throughput": 6149.5, "total_tokens": 589568} {"current_steps": 915, "total_steps": 33920, "loss": 0.7737, "lr": 2.694575471698113e-06, "epoch": 0.5395047169811321, "percentage": 2.7, "elapsed_time": "0:01:36", "remaining_time": "0:57:55", "throughput": 6148.15, "total_tokens": 592416} {"current_steps": 920, "total_steps": 33920, "loss": 0.4487, "lr": 2.709316037735849e-06, "epoch": 0.5424528301886793, "percentage": 2.71, "elapsed_time": "0:01:36", "remaining_time": "0:57:53", "throughput": 6149.47, "total_tokens": 595552} {"current_steps": 925, "total_steps": 33920, "loss": 0.5329, "lr": 2.724056603773585e-06, "epoch": 0.5454009433962265, "percentage": 2.73, "elapsed_time": "0:01:37", "remaining_time": "0:57:54", "throughput": 6151.37, "total_tokens": 599104} {"current_steps": 930, "total_steps": 33920, "loss": 0.5568, "lr": 2.738797169811321e-06, "epoch": 0.5483490566037735, "percentage": 2.74, "elapsed_time": "0:01:37", "remaining_time": "0:57:52", "throughput": 6152.78, "total_tokens": 602304} {"current_steps": 935, "total_steps": 33920, "loss": 0.947, "lr": 2.7535377358490567e-06, "epoch": 0.5512971698113207, "percentage": 2.76, "elapsed_time": "0:01:38", "remaining_time": "0:57:50", "throughput": 6153.14, "total_tokens": 605376} {"current_steps": 940, "total_steps": 33920, "loss": 0.9636, "lr": 2.7682783018867925e-06, "epoch": 0.5542452830188679, "percentage": 2.77, "elapsed_time": "0:01:38", "remaining_time": "0:57:46", "throughput": 6149.7, "total_tokens": 607648} {"current_steps": 945, "total_steps": 33920, "loss": 0.7103, "lr": 2.7830188679245286e-06, "epoch": 0.5571933962264151, "percentage": 2.79, "elapsed_time": "0:01:39", "remaining_time": "0:57:46", "throughput": 6151.92, "total_tokens": 611232} {"current_steps": 950, "total_steps": 33920, "loss": 0.6143, "lr": 2.7977594339622644e-06, "epoch": 0.5601415094339622, "percentage": 2.8, "elapsed_time": "0:01:40", "remaining_time": "0:57:51", "throughput": 6155.4, "total_tokens": 615776} {"current_steps": 955, "total_steps": 33920, "loss": 0.842, "lr": 2.8125e-06, "epoch": 0.5630896226415094, "percentage": 2.82, "elapsed_time": "0:01:40", "remaining_time": "0:57:50", "throughput": 6153.66, "total_tokens": 618656} {"current_steps": 960, "total_steps": 33920, "loss": 0.6467, "lr": 2.827240566037736e-06, "epoch": 0.5660377358490566, "percentage": 2.83, "elapsed_time": "0:01:41", "remaining_time": "0:57:51", "throughput": 6156.77, "total_tokens": 622528} {"current_steps": 965, "total_steps": 33920, "loss": 0.6852, "lr": 2.841981132075472e-06, "epoch": 0.5689858490566038, "percentage": 2.84, "elapsed_time": "0:01:41", "remaining_time": "0:57:51", "throughput": 6158.23, "total_tokens": 625920} {"current_steps": 970, "total_steps": 33920, "loss": 0.6648, "lr": 2.856721698113208e-06, "epoch": 0.5719339622641509, "percentage": 2.86, "elapsed_time": "0:01:42", "remaining_time": "0:57:48", "throughput": 6155.76, "total_tokens": 628544} {"current_steps": 975, "total_steps": 33920, "loss": 0.7258, "lr": 2.8714622641509437e-06, "epoch": 0.5748820754716981, "percentage": 2.87, "elapsed_time": "0:01:42", "remaining_time": "0:57:45", "throughput": 6152.87, "total_tokens": 631072} {"current_steps": 980, "total_steps": 33920, "loss": 0.6933, "lr": 2.8862028301886794e-06, "epoch": 0.5778301886792453, "percentage": 2.89, "elapsed_time": "0:01:42", "remaining_time": "0:57:41", "throughput": 6150.71, "total_tokens": 633504} {"current_steps": 985, "total_steps": 33920, "loss": 0.7531, "lr": 2.9009433962264156e-06, "epoch": 0.5807783018867925, "percentage": 2.9, "elapsed_time": "0:01:43", "remaining_time": "0:57:40", "throughput": 6152.31, "total_tokens": 636800} {"current_steps": 990, "total_steps": 33920, "loss": 0.5618, "lr": 2.9156839622641514e-06, "epoch": 0.5837264150943396, "percentage": 2.92, "elapsed_time": "0:01:44", "remaining_time": "0:57:40", "throughput": 6153.74, "total_tokens": 640160} {"current_steps": 995, "total_steps": 33920, "loss": 0.7435, "lr": 2.930424528301887e-06, "epoch": 0.5866745283018868, "percentage": 2.93, "elapsed_time": "0:01:44", "remaining_time": "0:57:42", "throughput": 6154.83, "total_tokens": 643936} {"current_steps": 1000, "total_steps": 33920, "loss": 0.5652, "lr": 2.9451650943396225e-06, "epoch": 0.589622641509434, "percentage": 2.95, "elapsed_time": "0:01:45", "remaining_time": "0:57:45", "throughput": 6159.37, "total_tokens": 648384} {"current_steps": 1005, "total_steps": 33920, "loss": 0.6299, "lr": 2.9599056603773587e-06, "epoch": 0.5925707547169812, "percentage": 2.96, "elapsed_time": "0:01:45", "remaining_time": "0:57:43", "throughput": 6158.25, "total_tokens": 651168} {"current_steps": 1010, "total_steps": 33920, "loss": 0.7942, "lr": 2.9746462264150945e-06, "epoch": 0.5955188679245284, "percentage": 2.98, "elapsed_time": "0:01:46", "remaining_time": "0:57:41", "throughput": 6158.59, "total_tokens": 654272} {"current_steps": 1015, "total_steps": 33920, "loss": 0.5136, "lr": 2.9893867924528302e-06, "epoch": 0.5984669811320755, "percentage": 2.99, "elapsed_time": "0:01:46", "remaining_time": "0:57:41", "throughput": 6160.79, "total_tokens": 657824} {"current_steps": 1020, "total_steps": 33920, "loss": 0.6794, "lr": 3.004127358490566e-06, "epoch": 0.6014150943396226, "percentage": 3.01, "elapsed_time": "0:01:47", "remaining_time": "0:57:41", "throughput": 6161.4, "total_tokens": 661184} {"current_steps": 1025, "total_steps": 33920, "loss": 0.6936, "lr": 3.018867924528302e-06, "epoch": 0.6043632075471698, "percentage": 3.02, "elapsed_time": "0:01:47", "remaining_time": "0:57:42", "throughput": 6164.54, "total_tokens": 665184} {"current_steps": 1030, "total_steps": 33920, "loss": 0.5847, "lr": 3.033608490566038e-06, "epoch": 0.6073113207547169, "percentage": 3.04, "elapsed_time": "0:01:48", "remaining_time": "0:57:40", "throughput": 6164.03, "total_tokens": 667968} {"current_steps": 1035, "total_steps": 33920, "loss": 0.5575, "lr": 3.0483490566037737e-06, "epoch": 0.6102594339622641, "percentage": 3.05, "elapsed_time": "0:01:48", "remaining_time": "0:57:40", "throughput": 6164.04, "total_tokens": 671360} {"current_steps": 1040, "total_steps": 33920, "loss": 0.5811, "lr": 3.0630896226415095e-06, "epoch": 0.6132075471698113, "percentage": 3.07, "elapsed_time": "0:01:49", "remaining_time": "0:57:38", "throughput": 6163.8, "total_tokens": 674336} {"current_steps": 1045, "total_steps": 33920, "loss": 0.5332, "lr": 3.0778301886792457e-06, "epoch": 0.6161556603773585, "percentage": 3.08, "elapsed_time": "0:01:49", "remaining_time": "0:57:37", "throughput": 6164.43, "total_tokens": 677504} {"current_steps": 1050, "total_steps": 33920, "loss": 0.6762, "lr": 3.0925707547169815e-06, "epoch": 0.6191037735849056, "percentage": 3.1, "elapsed_time": "0:01:50", "remaining_time": "0:57:36", "throughput": 6165.91, "total_tokens": 680864} {"current_steps": 1055, "total_steps": 33920, "loss": 0.6861, "lr": 3.1073113207547172e-06, "epoch": 0.6220518867924528, "percentage": 3.11, "elapsed_time": "0:01:50", "remaining_time": "0:57:34", "throughput": 6165.59, "total_tokens": 683776} {"current_steps": 1060, "total_steps": 33920, "loss": 0.6801, "lr": 3.122051886792453e-06, "epoch": 0.625, "percentage": 3.12, "elapsed_time": "0:01:51", "remaining_time": "0:57:33", "throughput": 6165.24, "total_tokens": 686784} {"current_steps": 1065, "total_steps": 33920, "loss": 0.5865, "lr": 3.136792452830189e-06, "epoch": 0.6279481132075472, "percentage": 3.14, "elapsed_time": "0:01:51", "remaining_time": "0:57:33", "throughput": 6165.77, "total_tokens": 690208} {"current_steps": 1070, "total_steps": 33920, "loss": 0.7595, "lr": 3.151533018867925e-06, "epoch": 0.6308962264150944, "percentage": 3.15, "elapsed_time": "0:01:52", "remaining_time": "0:57:33", "throughput": 6167.23, "total_tokens": 693664} {"current_steps": 1075, "total_steps": 33920, "loss": 0.8149, "lr": 3.1662735849056607e-06, "epoch": 0.6338443396226415, "percentage": 3.17, "elapsed_time": "0:01:53", "remaining_time": "0:57:34", "throughput": 6170.53, "total_tokens": 697696} {"current_steps": 1080, "total_steps": 33920, "loss": 0.6523, "lr": 3.181014150943397e-06, "epoch": 0.6367924528301887, "percentage": 3.18, "elapsed_time": "0:01:53", "remaining_time": "0:57:32", "throughput": 6168.83, "total_tokens": 700480} {"current_steps": 1085, "total_steps": 33920, "loss": 0.6243, "lr": 3.1957547169811327e-06, "epoch": 0.6397405660377359, "percentage": 3.2, "elapsed_time": "0:01:54", "remaining_time": "0:57:33", "throughput": 6170.69, "total_tokens": 704096} {"current_steps": 1090, "total_steps": 33920, "loss": 0.6165, "lr": 3.210495283018868e-06, "epoch": 0.6426886792452831, "percentage": 3.21, "elapsed_time": "0:01:54", "remaining_time": "0:57:30", "throughput": 6168.59, "total_tokens": 706720} {"current_steps": 1095, "total_steps": 33920, "loss": 0.7694, "lr": 3.225235849056604e-06, "epoch": 0.6456367924528302, "percentage": 3.23, "elapsed_time": "0:01:55", "remaining_time": "0:57:28", "throughput": 6167.1, "total_tokens": 709536} {"current_steps": 1100, "total_steps": 33920, "loss": 0.7433, "lr": 3.2399764150943396e-06, "epoch": 0.6485849056603774, "percentage": 3.24, "elapsed_time": "0:01:55", "remaining_time": "0:57:29", "throughput": 6168.39, "total_tokens": 713152} {"current_steps": 1105, "total_steps": 33920, "loss": 0.7226, "lr": 3.2547169811320758e-06, "epoch": 0.6515330188679245, "percentage": 3.26, "elapsed_time": "0:01:56", "remaining_time": "0:57:28", "throughput": 6167.73, "total_tokens": 716160} {"current_steps": 1110, "total_steps": 33920, "loss": 0.6081, "lr": 3.2694575471698115e-06, "epoch": 0.6544811320754716, "percentage": 3.27, "elapsed_time": "0:01:56", "remaining_time": "0:57:26", "throughput": 6167.26, "total_tokens": 719168} {"current_steps": 1115, "total_steps": 33920, "loss": 0.5957, "lr": 3.2841981132075473e-06, "epoch": 0.6574292452830188, "percentage": 3.29, "elapsed_time": "0:01:57", "remaining_time": "0:57:28", "throughput": 6168.08, "total_tokens": 722944} {"current_steps": 1120, "total_steps": 33920, "loss": 0.7109, "lr": 3.298938679245283e-06, "epoch": 0.660377358490566, "percentage": 3.3, "elapsed_time": "0:01:57", "remaining_time": "0:57:30", "throughput": 6168.87, "total_tokens": 726912} {"current_steps": 1125, "total_steps": 33920, "loss": 0.6351, "lr": 3.3136792452830192e-06, "epoch": 0.6633254716981132, "percentage": 3.32, "elapsed_time": "0:01:58", "remaining_time": "0:57:32", "throughput": 6170.15, "total_tokens": 730688} {"current_steps": 1130, "total_steps": 33920, "loss": 0.7068, "lr": 3.328419811320755e-06, "epoch": 0.6662735849056604, "percentage": 3.33, "elapsed_time": "0:01:59", "remaining_time": "0:57:33", "throughput": 6172.66, "total_tokens": 734656} {"current_steps": 1135, "total_steps": 33920, "loss": 0.7861, "lr": 3.3431603773584908e-06, "epoch": 0.6692216981132075, "percentage": 3.35, "elapsed_time": "0:01:59", "remaining_time": "0:57:31", "throughput": 6171.53, "total_tokens": 737408} {"current_steps": 1140, "total_steps": 33920, "loss": 0.5272, "lr": 3.3579009433962266e-06, "epoch": 0.6721698113207547, "percentage": 3.36, "elapsed_time": "0:01:59", "remaining_time": "0:57:29", "throughput": 6170.52, "total_tokens": 740224} {"current_steps": 1145, "total_steps": 33920, "loss": 0.5752, "lr": 3.3726415094339627e-06, "epoch": 0.6751179245283019, "percentage": 3.38, "elapsed_time": "0:02:00", "remaining_time": "0:57:26", "throughput": 6167.87, "total_tokens": 742688} {"current_steps": 1150, "total_steps": 33920, "loss": 0.6491, "lr": 3.3873820754716985e-06, "epoch": 0.6780660377358491, "percentage": 3.39, "elapsed_time": "0:02:00", "remaining_time": "0:57:25", "throughput": 6168.18, "total_tokens": 745728} {"current_steps": 1155, "total_steps": 33920, "loss": 0.586, "lr": 3.4021226415094343e-06, "epoch": 0.6810141509433962, "percentage": 3.41, "elapsed_time": "0:02:01", "remaining_time": "0:57:27", "throughput": 6171.7, "total_tokens": 749984} {"current_steps": 1160, "total_steps": 33920, "loss": 0.6162, "lr": 3.4168632075471705e-06, "epoch": 0.6839622641509434, "percentage": 3.42, "elapsed_time": "0:02:02", "remaining_time": "0:57:26", "throughput": 6173.53, "total_tokens": 753408} {"current_steps": 1165, "total_steps": 33920, "loss": 0.6239, "lr": 3.4316037735849062e-06, "epoch": 0.6869103773584906, "percentage": 3.43, "elapsed_time": "0:02:02", "remaining_time": "0:57:24", "throughput": 6171.2, "total_tokens": 755936} {"current_steps": 1170, "total_steps": 33920, "loss": 0.6231, "lr": 3.446344339622642e-06, "epoch": 0.6898584905660378, "percentage": 3.45, "elapsed_time": "0:02:02", "remaining_time": "0:57:22", "throughput": 6173.05, "total_tokens": 759264} {"current_steps": 1175, "total_steps": 33920, "loss": 0.5357, "lr": 3.4610849056603778e-06, "epoch": 0.6928066037735849, "percentage": 3.46, "elapsed_time": "0:02:03", "remaining_time": "0:57:23", "throughput": 6175.13, "total_tokens": 762976} {"current_steps": 1180, "total_steps": 33920, "loss": 0.5106, "lr": 3.475825471698113e-06, "epoch": 0.6957547169811321, "percentage": 3.48, "elapsed_time": "0:02:04", "remaining_time": "0:57:21", "throughput": 6174.2, "total_tokens": 765888} {"current_steps": 1185, "total_steps": 33920, "loss": 0.6496, "lr": 3.4905660377358493e-06, "epoch": 0.6987028301886793, "percentage": 3.49, "elapsed_time": "0:02:04", "remaining_time": "0:57:20", "throughput": 6175.21, "total_tokens": 769120} {"current_steps": 1190, "total_steps": 33920, "loss": 0.6433, "lr": 3.505306603773585e-06, "epoch": 0.7016509433962265, "percentage": 3.51, "elapsed_time": "0:02:05", "remaining_time": "0:57:20", "throughput": 6177.59, "total_tokens": 772704} {"current_steps": 1195, "total_steps": 33920, "loss": 0.6652, "lr": 3.520047169811321e-06, "epoch": 0.7045990566037735, "percentage": 3.52, "elapsed_time": "0:02:05", "remaining_time": "0:57:17", "throughput": 6177.42, "total_tokens": 775328} {"current_steps": 1200, "total_steps": 33920, "loss": 0.6089, "lr": 3.5347877358490566e-06, "epoch": 0.7075471698113207, "percentage": 3.54, "elapsed_time": "0:02:05", "remaining_time": "0:57:14", "throughput": 6176.79, "total_tokens": 778048} {"current_steps": 1205, "total_steps": 33920, "loss": 0.6877, "lr": 3.549528301886793e-06, "epoch": 0.7104952830188679, "percentage": 3.55, "elapsed_time": "0:02:06", "remaining_time": "0:57:14", "throughput": 6179.46, "total_tokens": 781792} {"current_steps": 1210, "total_steps": 33920, "loss": 0.6718, "lr": 3.5642688679245286e-06, "epoch": 0.7134433962264151, "percentage": 3.57, "elapsed_time": "0:02:06", "remaining_time": "0:57:11", "throughput": 6177.1, "total_tokens": 784000} {"current_steps": 1215, "total_steps": 33920, "loss": 0.7184, "lr": 3.5790094339622643e-06, "epoch": 0.7163915094339622, "percentage": 3.58, "elapsed_time": "0:02:07", "remaining_time": "0:57:13", "throughput": 6179.61, "total_tokens": 788256} {"current_steps": 1220, "total_steps": 33920, "loss": 0.6878, "lr": 3.59375e-06, "epoch": 0.7193396226415094, "percentage": 3.6, "elapsed_time": "0:02:08", "remaining_time": "0:57:13", "throughput": 6180.59, "total_tokens": 791648} {"current_steps": 1225, "total_steps": 33920, "loss": 0.5438, "lr": 3.6084905660377363e-06, "epoch": 0.7222877358490566, "percentage": 3.61, "elapsed_time": "0:02:08", "remaining_time": "0:57:15", "throughput": 6183.72, "total_tokens": 795872} {"current_steps": 1230, "total_steps": 33920, "loss": 0.6473, "lr": 3.623231132075472e-06, "epoch": 0.7252358490566038, "percentage": 3.63, "elapsed_time": "0:02:09", "remaining_time": "0:57:13", "throughput": 6182.18, "total_tokens": 798752} {"current_steps": 1235, "total_steps": 33920, "loss": 0.6027, "lr": 3.637971698113208e-06, "epoch": 0.7281839622641509, "percentage": 3.64, "elapsed_time": "0:02:09", "remaining_time": "0:57:13", "throughput": 6182.55, "total_tokens": 802048} {"current_steps": 1240, "total_steps": 33920, "loss": 0.65, "lr": 3.652712264150944e-06, "epoch": 0.7311320754716981, "percentage": 3.66, "elapsed_time": "0:02:10", "remaining_time": "0:57:11", "throughput": 6181.42, "total_tokens": 804768} {"current_steps": 1245, "total_steps": 33920, "loss": 0.6283, "lr": 3.66745283018868e-06, "epoch": 0.7340801886792453, "percentage": 3.67, "elapsed_time": "0:02:10", "remaining_time": "0:57:12", "throughput": 6184.13, "total_tokens": 808896} {"current_steps": 1250, "total_steps": 33920, "loss": 0.6092, "lr": 3.6821933962264156e-06, "epoch": 0.7370283018867925, "percentage": 3.69, "elapsed_time": "0:02:11", "remaining_time": "0:57:12", "throughput": 6185.74, "total_tokens": 812288} {"current_steps": 1255, "total_steps": 33920, "loss": 0.6638, "lr": 3.6969339622641513e-06, "epoch": 0.7399764150943396, "percentage": 3.7, "elapsed_time": "0:02:11", "remaining_time": "0:57:12", "throughput": 6186.68, "total_tokens": 815840} {"current_steps": 1260, "total_steps": 33920, "loss": 0.5759, "lr": 3.7116745283018875e-06, "epoch": 0.7429245283018868, "percentage": 3.71, "elapsed_time": "0:02:12", "remaining_time": "0:57:12", "throughput": 6186.21, "total_tokens": 819168} {"current_steps": 1265, "total_steps": 33920, "loss": 0.4967, "lr": 3.726415094339623e-06, "epoch": 0.745872641509434, "percentage": 3.73, "elapsed_time": "0:02:13", "remaining_time": "0:57:13", "throughput": 6186.52, "total_tokens": 822944} {"current_steps": 1270, "total_steps": 33920, "loss": 0.6567, "lr": 3.7411556603773586e-06, "epoch": 0.7488207547169812, "percentage": 3.74, "elapsed_time": "0:02:13", "remaining_time": "0:57:13", "throughput": 6187.33, "total_tokens": 826272} {"current_steps": 1275, "total_steps": 33920, "loss": 0.585, "lr": 3.7558962264150944e-06, "epoch": 0.7517688679245284, "percentage": 3.76, "elapsed_time": "0:02:14", "remaining_time": "0:57:13", "throughput": 6190.01, "total_tokens": 830144} {"current_steps": 1280, "total_steps": 33920, "loss": 0.6279, "lr": 3.77063679245283e-06, "epoch": 0.7547169811320755, "percentage": 3.77, "elapsed_time": "0:02:14", "remaining_time": "0:57:12", "throughput": 6188.9, "total_tokens": 832960} {"current_steps": 1285, "total_steps": 33920, "loss": 0.6032, "lr": 3.7853773584905664e-06, "epoch": 0.7576650943396226, "percentage": 3.79, "elapsed_time": "0:02:15", "remaining_time": "0:57:09", "throughput": 6186.72, "total_tokens": 835392} {"current_steps": 1290, "total_steps": 33920, "loss": 0.5209, "lr": 3.800117924528302e-06, "epoch": 0.7606132075471698, "percentage": 3.8, "elapsed_time": "0:02:15", "remaining_time": "0:57:08", "throughput": 6186.81, "total_tokens": 838592} {"current_steps": 1295, "total_steps": 33920, "loss": 0.4959, "lr": 3.814858490566038e-06, "epoch": 0.7635613207547169, "percentage": 3.82, "elapsed_time": "0:02:16", "remaining_time": "0:57:07", "throughput": 6188.06, "total_tokens": 841824} {"current_steps": 1300, "total_steps": 33920, "loss": 0.5725, "lr": 3.829599056603774e-06, "epoch": 0.7665094339622641, "percentage": 3.83, "elapsed_time": "0:02:16", "remaining_time": "0:57:08", "throughput": 6189.12, "total_tokens": 845760} {"current_steps": 1305, "total_steps": 33920, "loss": 0.8529, "lr": 3.8443396226415094e-06, "epoch": 0.7694575471698113, "percentage": 3.85, "elapsed_time": "0:02:17", "remaining_time": "0:57:19", "throughput": 6193.82, "total_tokens": 852288} {"current_steps": 1310, "total_steps": 33920, "loss": 0.553, "lr": 3.859080188679246e-06, "epoch": 0.7724056603773585, "percentage": 3.86, "elapsed_time": "0:02:18", "remaining_time": "0:57:16", "throughput": 6193.13, "total_tokens": 855008} {"current_steps": 1315, "total_steps": 33920, "loss": 0.5266, "lr": 3.873820754716982e-06, "epoch": 0.7753537735849056, "percentage": 3.88, "elapsed_time": "0:02:18", "remaining_time": "0:57:14", "throughput": 6191.94, "total_tokens": 857728} {"current_steps": 1320, "total_steps": 33920, "loss": 0.5665, "lr": 3.888561320754717e-06, "epoch": 0.7783018867924528, "percentage": 3.89, "elapsed_time": "0:02:19", "remaining_time": "0:57:14", "throughput": 6194.37, "total_tokens": 861472} {"current_steps": 1325, "total_steps": 33920, "loss": 0.6286, "lr": 3.903301886792453e-06, "epoch": 0.78125, "percentage": 3.91, "elapsed_time": "0:02:19", "remaining_time": "0:57:16", "throughput": 6196.87, "total_tokens": 865568} {"current_steps": 1330, "total_steps": 33920, "loss": 0.7196, "lr": 3.9180424528301895e-06, "epoch": 0.7841981132075472, "percentage": 3.92, "elapsed_time": "0:02:20", "remaining_time": "0:57:15", "throughput": 6197.45, "total_tokens": 868928} {"current_steps": 1335, "total_steps": 33920, "loss": 0.4917, "lr": 3.932783018867925e-06, "epoch": 0.7871462264150944, "percentage": 3.94, "elapsed_time": "0:02:20", "remaining_time": "0:57:14", "throughput": 6197.56, "total_tokens": 872096} {"current_steps": 1340, "total_steps": 33920, "loss": 0.434, "lr": 3.947523584905661e-06, "epoch": 0.7900943396226415, "percentage": 3.95, "elapsed_time": "0:02:21", "remaining_time": "0:57:14", "throughput": 6197.11, "total_tokens": 875296} {"current_steps": 1345, "total_steps": 33920, "loss": 0.5318, "lr": 3.962264150943396e-06, "epoch": 0.7930424528301887, "percentage": 3.97, "elapsed_time": "0:02:21", "remaining_time": "0:57:12", "throughput": 6196.72, "total_tokens": 878144} {"current_steps": 1350, "total_steps": 33920, "loss": 0.7072, "lr": 3.977004716981133e-06, "epoch": 0.7959905660377359, "percentage": 3.98, "elapsed_time": "0:02:22", "remaining_time": "0:57:10", "throughput": 6195.81, "total_tokens": 880928} {"current_steps": 1355, "total_steps": 33920, "loss": 0.5436, "lr": 3.991745283018868e-06, "epoch": 0.7989386792452831, "percentage": 3.99, "elapsed_time": "0:02:22", "remaining_time": "0:57:08", "throughput": 6194.89, "total_tokens": 883680} {"current_steps": 1360, "total_steps": 33920, "loss": 0.7083, "lr": 4.006485849056604e-06, "epoch": 0.8018867924528302, "percentage": 4.01, "elapsed_time": "0:02:23", "remaining_time": "0:57:06", "throughput": 6193.61, "total_tokens": 886368} {"current_steps": 1365, "total_steps": 33920, "loss": 0.7309, "lr": 4.0212264150943395e-06, "epoch": 0.8048349056603774, "percentage": 4.02, "elapsed_time": "0:02:23", "remaining_time": "0:57:05", "throughput": 6194.01, "total_tokens": 889728} {"current_steps": 1370, "total_steps": 33920, "loss": 0.5954, "lr": 4.035966981132076e-06, "epoch": 0.8077830188679245, "percentage": 4.04, "elapsed_time": "0:02:24", "remaining_time": "0:57:05", "throughput": 6194.41, "total_tokens": 892992} {"current_steps": 1375, "total_steps": 33920, "loss": 0.6435, "lr": 4.050707547169812e-06, "epoch": 0.8107311320754716, "percentage": 4.05, "elapsed_time": "0:02:24", "remaining_time": "0:57:03", "throughput": 6192.96, "total_tokens": 895712} {"current_steps": 1380, "total_steps": 33920, "loss": 0.6819, "lr": 4.065448113207547e-06, "epoch": 0.8136792452830188, "percentage": 4.07, "elapsed_time": "0:02:25", "remaining_time": "0:57:01", "throughput": 6192.17, "total_tokens": 898400} {"current_steps": 1385, "total_steps": 33920, "loss": 0.5789, "lr": 4.080188679245283e-06, "epoch": 0.816627358490566, "percentage": 4.08, "elapsed_time": "0:02:25", "remaining_time": "0:56:59", "throughput": 6192.21, "total_tokens": 901440} {"current_steps": 1390, "total_steps": 33920, "loss": 0.6054, "lr": 4.094929245283019e-06, "epoch": 0.8195754716981132, "percentage": 4.1, "elapsed_time": "0:02:26", "remaining_time": "0:56:58", "throughput": 6191.16, "total_tokens": 904288} {"current_steps": 1395, "total_steps": 33920, "loss": 0.5652, "lr": 4.109669811320755e-06, "epoch": 0.8225235849056604, "percentage": 4.11, "elapsed_time": "0:02:26", "remaining_time": "0:56:58", "throughput": 6191.45, "total_tokens": 907776} {"current_steps": 1400, "total_steps": 33920, "loss": 0.6495, "lr": 4.124410377358491e-06, "epoch": 0.8254716981132075, "percentage": 4.13, "elapsed_time": "0:02:27", "remaining_time": "0:56:59", "throughput": 6192.96, "total_tokens": 911584} {"current_steps": 1405, "total_steps": 33920, "loss": 0.5128, "lr": 4.1391509433962265e-06, "epoch": 0.8284198113207547, "percentage": 4.14, "elapsed_time": "0:02:27", "remaining_time": "0:56:59", "throughput": 6193.71, "total_tokens": 915232} {"current_steps": 1410, "total_steps": 33920, "loss": 0.5075, "lr": 4.153891509433963e-06, "epoch": 0.8313679245283019, "percentage": 4.16, "elapsed_time": "0:02:28", "remaining_time": "0:56:58", "throughput": 6190.33, "total_tokens": 917696} {"current_steps": 1415, "total_steps": 33920, "loss": 0.7284, "lr": 4.168632075471699e-06, "epoch": 0.8343160377358491, "percentage": 4.17, "elapsed_time": "0:02:28", "remaining_time": "0:57:01", "throughput": 6193.84, "total_tokens": 922656} {"current_steps": 1420, "total_steps": 33920, "loss": 0.4272, "lr": 4.183372641509434e-06, "epoch": 0.8372641509433962, "percentage": 4.19, "elapsed_time": "0:02:29", "remaining_time": "0:57:01", "throughput": 6193.73, "total_tokens": 925856} {"current_steps": 1425, "total_steps": 33920, "loss": 0.661, "lr": 4.19811320754717e-06, "epoch": 0.8402122641509434, "percentage": 4.2, "elapsed_time": "0:02:30", "remaining_time": "0:57:02", "throughput": 6197.02, "total_tokens": 930176} {"current_steps": 1430, "total_steps": 33920, "loss": 0.6749, "lr": 4.212853773584907e-06, "epoch": 0.8431603773584906, "percentage": 4.22, "elapsed_time": "0:02:30", "remaining_time": "0:57:01", "throughput": 6197.88, "total_tokens": 933472} {"current_steps": 1435, "total_steps": 33920, "loss": 0.5572, "lr": 4.227594339622642e-06, "epoch": 0.8461084905660378, "percentage": 4.23, "elapsed_time": "0:02:31", "remaining_time": "0:57:00", "throughput": 6197.7, "total_tokens": 936416} {"current_steps": 1440, "total_steps": 33920, "loss": 0.6833, "lr": 4.242334905660378e-06, "epoch": 0.8490566037735849, "percentage": 4.25, "elapsed_time": "0:02:31", "remaining_time": "0:56:58", "throughput": 6196.94, "total_tokens": 939136} {"current_steps": 1445, "total_steps": 33920, "loss": 0.6223, "lr": 4.2570754716981135e-06, "epoch": 0.8520047169811321, "percentage": 4.26, "elapsed_time": "0:02:32", "remaining_time": "0:57:00", "throughput": 6197.68, "total_tokens": 943168} {"current_steps": 1450, "total_steps": 33920, "loss": 0.5195, "lr": 4.271816037735849e-06, "epoch": 0.8549528301886793, "percentage": 4.27, "elapsed_time": "0:02:32", "remaining_time": "0:56:57", "throughput": 6195.31, "total_tokens": 945568} {"current_steps": 1455, "total_steps": 33920, "loss": 0.5574, "lr": 4.286556603773585e-06, "epoch": 0.8579009433962265, "percentage": 4.29, "elapsed_time": "0:02:33", "remaining_time": "0:56:55", "throughput": 6194.95, "total_tokens": 948416} {"current_steps": 1460, "total_steps": 33920, "loss": 0.5297, "lr": 4.301297169811321e-06, "epoch": 0.8608490566037735, "percentage": 4.3, "elapsed_time": "0:02:33", "remaining_time": "0:56:54", "throughput": 6192.37, "total_tokens": 950880} {"current_steps": 1465, "total_steps": 33920, "loss": 0.5256, "lr": 4.3160377358490565e-06, "epoch": 0.8637971698113207, "percentage": 4.32, "elapsed_time": "0:02:34", "remaining_time": "0:56:52", "throughput": 6191.78, "total_tokens": 953632} {"current_steps": 1470, "total_steps": 33920, "loss": 0.6593, "lr": 4.330778301886793e-06, "epoch": 0.8667452830188679, "percentage": 4.33, "elapsed_time": "0:02:34", "remaining_time": "0:56:50", "throughput": 6190.1, "total_tokens": 956320} {"current_steps": 1475, "total_steps": 33920, "loss": 0.6287, "lr": 4.345518867924529e-06, "epoch": 0.8696933962264151, "percentage": 4.35, "elapsed_time": "0:02:35", "remaining_time": "0:56:49", "throughput": 6191.33, "total_tokens": 959712} {"current_steps": 1480, "total_steps": 33920, "loss": 0.5644, "lr": 4.360259433962264e-06, "epoch": 0.8726415094339622, "percentage": 4.36, "elapsed_time": "0:02:35", "remaining_time": "0:56:49", "throughput": 6192.94, "total_tokens": 963264} {"current_steps": 1485, "total_steps": 33920, "loss": 0.5753, "lr": 4.3750000000000005e-06, "epoch": 0.8755896226415094, "percentage": 4.38, "elapsed_time": "0:02:36", "remaining_time": "0:56:50", "throughput": 6194.98, "total_tokens": 967424} {"current_steps": 1490, "total_steps": 33920, "loss": 0.5454, "lr": 4.389740566037737e-06, "epoch": 0.8785377358490566, "percentage": 4.39, "elapsed_time": "0:02:37", "remaining_time": "0:57:02", "throughput": 6197.81, "total_tokens": 974592} {"current_steps": 1495, "total_steps": 33920, "loss": 0.6659, "lr": 4.404481132075472e-06, "epoch": 0.8814858490566038, "percentage": 4.41, "elapsed_time": "0:02:37", "remaining_time": "0:57:03", "throughput": 6200.4, "total_tokens": 978784} {"current_steps": 1500, "total_steps": 33920, "loss": 0.5154, "lr": 4.419221698113208e-06, "epoch": 0.8844339622641509, "percentage": 4.42, "elapsed_time": "0:02:38", "remaining_time": "0:57:02", "throughput": 6200.08, "total_tokens": 981696} {"current_steps": 1505, "total_steps": 33920, "loss": 0.6376, "lr": 4.4339622641509435e-06, "epoch": 0.8873820754716981, "percentage": 4.44, "elapsed_time": "0:02:38", "remaining_time": "0:57:02", "throughput": 6201.13, "total_tokens": 985408} {"current_steps": 1510, "total_steps": 33920, "loss": 0.6862, "lr": 4.44870283018868e-06, "epoch": 0.8903301886792453, "percentage": 4.45, "elapsed_time": "0:02:39", "remaining_time": "0:57:01", "throughput": 6201.92, "total_tokens": 988576} {"current_steps": 1515, "total_steps": 33920, "loss": 0.59, "lr": 4.463443396226416e-06, "epoch": 0.8932783018867925, "percentage": 4.47, "elapsed_time": "0:02:39", "remaining_time": "0:57:00", "throughput": 6203.03, "total_tokens": 991840} {"current_steps": 1520, "total_steps": 33920, "loss": 0.6499, "lr": 4.478183962264151e-06, "epoch": 0.8962264150943396, "percentage": 4.48, "elapsed_time": "0:02:40", "remaining_time": "0:56:59", "throughput": 6203.64, "total_tokens": 995200} {"current_steps": 1525, "total_steps": 33920, "loss": 0.6689, "lr": 4.4929245283018875e-06, "epoch": 0.8991745283018868, "percentage": 4.5, "elapsed_time": "0:02:40", "remaining_time": "0:56:59", "throughput": 6204.68, "total_tokens": 998912} {"current_steps": 1530, "total_steps": 33920, "loss": 0.5739, "lr": 4.507665094339623e-06, "epoch": 0.902122641509434, "percentage": 4.51, "elapsed_time": "0:02:41", "remaining_time": "0:57:00", "throughput": 6206.28, "total_tokens": 1002848} {"current_steps": 1535, "total_steps": 33920, "loss": 0.6967, "lr": 4.522405660377359e-06, "epoch": 0.9050707547169812, "percentage": 4.53, "elapsed_time": "0:02:42", "remaining_time": "0:56:59", "throughput": 6202.88, "total_tokens": 1005312} {"current_steps": 1540, "total_steps": 33920, "loss": 0.5949, "lr": 4.537146226415094e-06, "epoch": 0.9080188679245284, "percentage": 4.54, "elapsed_time": "0:02:42", "remaining_time": "0:56:58", "throughput": 6203.95, "total_tokens": 1008576} {"current_steps": 1545, "total_steps": 33920, "loss": 0.6176, "lr": 4.5518867924528305e-06, "epoch": 0.9109669811320755, "percentage": 4.55, "elapsed_time": "0:02:43", "remaining_time": "0:56:59", "throughput": 6206.01, "total_tokens": 1012736} {"current_steps": 1550, "total_steps": 33920, "loss": 0.5534, "lr": 4.566627358490566e-06, "epoch": 0.9139150943396226, "percentage": 4.57, "elapsed_time": "0:02:43", "remaining_time": "0:56:59", "throughput": 6207.73, "total_tokens": 1016320} {"current_steps": 1555, "total_steps": 33920, "loss": 0.6508, "lr": 4.581367924528302e-06, "epoch": 0.9168632075471698, "percentage": 4.58, "elapsed_time": "0:02:44", "remaining_time": "0:56:57", "throughput": 6207.96, "total_tokens": 1019392} {"current_steps": 1560, "total_steps": 33920, "loss": 0.4678, "lr": 4.596108490566038e-06, "epoch": 0.9198113207547169, "percentage": 4.6, "elapsed_time": "0:02:44", "remaining_time": "0:56:55", "throughput": 6207.47, "total_tokens": 1022080} {"current_steps": 1565, "total_steps": 33920, "loss": 0.5864, "lr": 4.610849056603774e-06, "epoch": 0.9227594339622641, "percentage": 4.61, "elapsed_time": "0:02:45", "remaining_time": "0:56:53", "throughput": 6206.87, "total_tokens": 1024960} {"current_steps": 1570, "total_steps": 33920, "loss": 0.6301, "lr": 4.62558962264151e-06, "epoch": 0.9257075471698113, "percentage": 4.63, "elapsed_time": "0:02:45", "remaining_time": "0:56:53", "throughput": 6208.31, "total_tokens": 1028480} {"current_steps": 1575, "total_steps": 33920, "loss": 0.5089, "lr": 4.640330188679246e-06, "epoch": 0.9286556603773585, "percentage": 4.64, "elapsed_time": "0:02:46", "remaining_time": "0:56:52", "throughput": 6206.97, "total_tokens": 1031328} {"current_steps": 1580, "total_steps": 33920, "loss": 0.4194, "lr": 4.655070754716981e-06, "epoch": 0.9316037735849056, "percentage": 4.66, "elapsed_time": "0:02:46", "remaining_time": "0:56:50", "throughput": 6205.33, "total_tokens": 1034048} {"current_steps": 1585, "total_steps": 33920, "loss": 0.5023, "lr": 4.6698113207547175e-06, "epoch": 0.9345518867924528, "percentage": 4.67, "elapsed_time": "0:02:47", "remaining_time": "0:56:49", "throughput": 6205.17, "total_tokens": 1037024} {"current_steps": 1590, "total_steps": 33920, "loss": 0.5958, "lr": 4.684551886792454e-06, "epoch": 0.9375, "percentage": 4.69, "elapsed_time": "0:02:47", "remaining_time": "0:56:48", "throughput": 6205.54, "total_tokens": 1040128} {"current_steps": 1595, "total_steps": 33920, "loss": 0.5879, "lr": 4.699292452830189e-06, "epoch": 0.9404481132075472, "percentage": 4.7, "elapsed_time": "0:02:48", "remaining_time": "0:56:47", "throughput": 6205.61, "total_tokens": 1043328} {"current_steps": 1600, "total_steps": 33920, "loss": 0.5938, "lr": 4.714033018867925e-06, "epoch": 0.9433962264150944, "percentage": 4.72, "elapsed_time": "0:02:48", "remaining_time": "0:56:45", "throughput": 6205.21, "total_tokens": 1046176} {"current_steps": 1605, "total_steps": 33920, "loss": 0.6332, "lr": 4.728773584905661e-06, "epoch": 0.9463443396226415, "percentage": 4.73, "elapsed_time": "0:02:49", "remaining_time": "0:56:43", "throughput": 6204.4, "total_tokens": 1048896} {"current_steps": 1610, "total_steps": 33920, "loss": 0.6347, "lr": 4.743514150943397e-06, "epoch": 0.9492924528301887, "percentage": 4.75, "elapsed_time": "0:02:49", "remaining_time": "0:56:44", "throughput": 6206.12, "total_tokens": 1052768} {"current_steps": 1615, "total_steps": 33920, "loss": 0.5877, "lr": 4.758254716981133e-06, "epoch": 0.9522405660377359, "percentage": 4.76, "elapsed_time": "0:02:50", "remaining_time": "0:56:42", "throughput": 6206.14, "total_tokens": 1055616} {"current_steps": 1620, "total_steps": 33920, "loss": 0.5421, "lr": 4.772995283018868e-06, "epoch": 0.9551886792452831, "percentage": 4.78, "elapsed_time": "0:02:50", "remaining_time": "0:56:41", "throughput": 6207.46, "total_tokens": 1059072} {"current_steps": 1625, "total_steps": 33920, "loss": 0.7592, "lr": 4.787735849056604e-06, "epoch": 0.9581367924528302, "percentage": 4.79, "elapsed_time": "0:02:51", "remaining_time": "0:56:39", "throughput": 6207.52, "total_tokens": 1061920} {"current_steps": 1630, "total_steps": 33920, "loss": 0.581, "lr": 4.80247641509434e-06, "epoch": 0.9610849056603774, "percentage": 4.81, "elapsed_time": "0:02:51", "remaining_time": "0:56:38", "throughput": 6207.57, "total_tokens": 1064896} {"current_steps": 1635, "total_steps": 33920, "loss": 0.6342, "lr": 4.817216981132076e-06, "epoch": 0.9640330188679245, "percentage": 4.82, "elapsed_time": "0:02:52", "remaining_time": "0:56:36", "throughput": 6207.18, "total_tokens": 1067744} {"current_steps": 1640, "total_steps": 33920, "loss": 0.5076, "lr": 4.831957547169811e-06, "epoch": 0.9669811320754716, "percentage": 4.83, "elapsed_time": "0:02:52", "remaining_time": "0:56:35", "throughput": 6207.73, "total_tokens": 1070944} {"current_steps": 1645, "total_steps": 33920, "loss": 0.5585, "lr": 4.8466981132075476e-06, "epoch": 0.9699292452830188, "percentage": 4.85, "elapsed_time": "0:02:53", "remaining_time": "0:56:34", "throughput": 6207.05, "total_tokens": 1073888} {"current_steps": 1650, "total_steps": 33920, "loss": 0.8427, "lr": 4.861438679245283e-06, "epoch": 0.972877358490566, "percentage": 4.86, "elapsed_time": "0:02:53", "remaining_time": "0:56:37", "throughput": 6208.39, "total_tokens": 1078592} {"current_steps": 1655, "total_steps": 33920, "loss": 0.5229, "lr": 4.876179245283019e-06, "epoch": 0.9758254716981132, "percentage": 4.88, "elapsed_time": "0:02:54", "remaining_time": "0:56:37", "throughput": 6209.01, "total_tokens": 1081920} {"current_steps": 1660, "total_steps": 33920, "loss": 0.6266, "lr": 4.890919811320755e-06, "epoch": 0.9787735849056604, "percentage": 4.89, "elapsed_time": "0:02:54", "remaining_time": "0:56:35", "throughput": 6208.43, "total_tokens": 1084800} {"current_steps": 1665, "total_steps": 33920, "loss": 0.5046, "lr": 4.905660377358491e-06, "epoch": 0.9817216981132075, "percentage": 4.91, "elapsed_time": "0:02:55", "remaining_time": "0:56:36", "throughput": 6210.32, "total_tokens": 1088832} {"current_steps": 1670, "total_steps": 33920, "loss": 0.8285, "lr": 4.920400943396227e-06, "epoch": 0.9846698113207547, "percentage": 4.92, "elapsed_time": "0:02:55", "remaining_time": "0:56:36", "throughput": 6211.72, "total_tokens": 1092608} {"current_steps": 1675, "total_steps": 33920, "loss": 0.5754, "lr": 4.935141509433963e-06, "epoch": 0.9876179245283019, "percentage": 4.94, "elapsed_time": "0:02:56", "remaining_time": "0:56:35", "throughput": 6211.74, "total_tokens": 1095776} {"current_steps": 1680, "total_steps": 33920, "loss": 0.4921, "lr": 4.949882075471698e-06, "epoch": 0.9905660377358491, "percentage": 4.95, "elapsed_time": "0:02:56", "remaining_time": "0:56:34", "throughput": 6211.85, "total_tokens": 1098816} {"current_steps": 1685, "total_steps": 33920, "loss": 0.5883, "lr": 4.9646226415094346e-06, "epoch": 0.9935141509433962, "percentage": 4.97, "elapsed_time": "0:02:57", "remaining_time": "0:56:32", "throughput": 6211.72, "total_tokens": 1101664} {"current_steps": 1690, "total_steps": 33920, "loss": 0.5248, "lr": 4.979363207547171e-06, "epoch": 0.9964622641509434, "percentage": 4.98, "elapsed_time": "0:02:57", "remaining_time": "0:56:33", "throughput": 6213.36, "total_tokens": 1105504} {"current_steps": 1695, "total_steps": 33920, "loss": 0.6374, "lr": 4.994103773584906e-06, "epoch": 0.9994103773584906, "percentage": 5.0, "elapsed_time": "0:02:58", "remaining_time": "0:56:32", "throughput": 6214.77, "total_tokens": 1109088} {"current_steps": 1700, "total_steps": 33920, "loss": 0.4929, "lr": 5.0088443396226414e-06, "epoch": 1.0023584905660377, "percentage": 5.01, "elapsed_time": "0:02:59", "remaining_time": "0:56:36", "throughput": 6202.41, "total_tokens": 1111592} {"current_steps": 1705, "total_steps": 33920, "loss": 0.6107, "lr": 5.023584905660378e-06, "epoch": 1.005306603773585, "percentage": 5.03, "elapsed_time": "0:02:59", "remaining_time": "0:56:36", "throughput": 6203.36, "total_tokens": 1115016} {"current_steps": 1710, "total_steps": 33920, "loss": 0.5915, "lr": 5.038325471698113e-06, "epoch": 1.008254716981132, "percentage": 5.04, "elapsed_time": "0:03:00", "remaining_time": "0:56:35", "throughput": 6204.0, "total_tokens": 1118248} {"current_steps": 1715, "total_steps": 33920, "loss": 0.5639, "lr": 5.05306603773585e-06, "epoch": 1.0112028301886793, "percentage": 5.06, "elapsed_time": "0:03:00", "remaining_time": "0:56:36", "throughput": 6204.36, "total_tokens": 1122312} {"current_steps": 1720, "total_steps": 33920, "loss": 0.5197, "lr": 5.067806603773585e-06, "epoch": 1.0141509433962264, "percentage": 5.07, "elapsed_time": "0:03:01", "remaining_time": "0:56:36", "throughput": 6205.37, "total_tokens": 1125736} {"current_steps": 1725, "total_steps": 33920, "loss": 0.4926, "lr": 5.0825471698113216e-06, "epoch": 1.0170990566037736, "percentage": 5.09, "elapsed_time": "0:03:01", "remaining_time": "0:56:33", "throughput": 6203.66, "total_tokens": 1128040} {"current_steps": 1730, "total_steps": 33920, "loss": 0.4927, "lr": 5.097287735849057e-06, "epoch": 1.0200471698113207, "percentage": 5.1, "elapsed_time": "0:03:02", "remaining_time": "0:56:32", "throughput": 6203.91, "total_tokens": 1131176} {"current_steps": 1735, "total_steps": 33920, "loss": 0.5068, "lr": 5.112028301886793e-06, "epoch": 1.022995283018868, "percentage": 5.11, "elapsed_time": "0:03:02", "remaining_time": "0:56:31", "throughput": 6204.81, "total_tokens": 1134504} {"current_steps": 1740, "total_steps": 33920, "loss": 0.4646, "lr": 5.1267688679245284e-06, "epoch": 1.025943396226415, "percentage": 5.13, "elapsed_time": "0:03:03", "remaining_time": "0:56:29", "throughput": 6204.4, "total_tokens": 1137224} {"current_steps": 1745, "total_steps": 33920, "loss": 0.5454, "lr": 5.1415094339622655e-06, "epoch": 1.0288915094339623, "percentage": 5.14, "elapsed_time": "0:03:03", "remaining_time": "0:56:30", "throughput": 6205.84, "total_tokens": 1141160} {"current_steps": 1750, "total_steps": 33920, "loss": 0.4068, "lr": 5.156250000000001e-06, "epoch": 1.0318396226415094, "percentage": 5.16, "elapsed_time": "0:03:04", "remaining_time": "0:56:30", "throughput": 6207.1, "total_tokens": 1144840} {"current_steps": 1755, "total_steps": 33920, "loss": 0.7379, "lr": 5.170990566037736e-06, "epoch": 1.0347877358490567, "percentage": 5.17, "elapsed_time": "0:03:04", "remaining_time": "0:56:29", "throughput": 6206.44, "total_tokens": 1147688} {"current_steps": 1760, "total_steps": 33920, "loss": 0.6728, "lr": 5.185731132075472e-06, "epoch": 1.0377358490566038, "percentage": 5.19, "elapsed_time": "0:03:05", "remaining_time": "0:56:28", "throughput": 6207.02, "total_tokens": 1151144} {"current_steps": 1765, "total_steps": 33920, "loss": 0.5028, "lr": 5.200471698113208e-06, "epoch": 1.040683962264151, "percentage": 5.2, "elapsed_time": "0:03:05", "remaining_time": "0:56:27", "throughput": 6204.78, "total_tokens": 1153576} {"current_steps": 1770, "total_steps": 33920, "loss": 0.606, "lr": 5.215212264150944e-06, "epoch": 1.0436320754716981, "percentage": 5.22, "elapsed_time": "0:03:06", "remaining_time": "0:56:25", "throughput": 6204.98, "total_tokens": 1156520} {"current_steps": 1775, "total_steps": 33920, "loss": 0.727, "lr": 5.229952830188679e-06, "epoch": 1.0465801886792452, "percentage": 5.23, "elapsed_time": "0:03:06", "remaining_time": "0:56:23", "throughput": 6203.58, "total_tokens": 1159112} {"current_steps": 1780, "total_steps": 33920, "loss": 0.6011, "lr": 5.2446933962264154e-06, "epoch": 1.0495283018867925, "percentage": 5.25, "elapsed_time": "0:03:07", "remaining_time": "0:56:23", "throughput": 6204.28, "total_tokens": 1162696} {"current_steps": 1785, "total_steps": 33920, "loss": 0.4691, "lr": 5.259433962264151e-06, "epoch": 1.0524764150943395, "percentage": 5.26, "elapsed_time": "0:03:07", "remaining_time": "0:56:23", "throughput": 6205.06, "total_tokens": 1166216} {"current_steps": 1790, "total_steps": 33920, "loss": 0.6155, "lr": 5.274174528301888e-06, "epoch": 1.0554245283018868, "percentage": 5.28, "elapsed_time": "0:03:08", "remaining_time": "0:56:22", "throughput": 6206.39, "total_tokens": 1169704} {"current_steps": 1795, "total_steps": 33920, "loss": 0.5914, "lr": 5.288915094339623e-06, "epoch": 1.0583726415094339, "percentage": 5.29, "elapsed_time": "0:03:09", "remaining_time": "0:56:22", "throughput": 6206.16, "total_tokens": 1172968} {"current_steps": 1800, "total_steps": 33920, "loss": 0.6862, "lr": 5.303655660377359e-06, "epoch": 1.0613207547169812, "percentage": 5.31, "elapsed_time": "0:03:09", "remaining_time": "0:56:22", "throughput": 6207.97, "total_tokens": 1176872} {"current_steps": 1805, "total_steps": 33920, "loss": 0.4426, "lr": 5.318396226415095e-06, "epoch": 1.0642688679245282, "percentage": 5.32, "elapsed_time": "0:03:10", "remaining_time": "0:56:20", "throughput": 6206.57, "total_tokens": 1179304} {"current_steps": 1810, "total_steps": 33920, "loss": 0.4884, "lr": 5.333136792452831e-06, "epoch": 1.0672169811320755, "percentage": 5.34, "elapsed_time": "0:03:10", "remaining_time": "0:56:19", "throughput": 6206.32, "total_tokens": 1182408} {"current_steps": 1815, "total_steps": 33920, "loss": 0.4798, "lr": 5.347877358490566e-06, "epoch": 1.0701650943396226, "percentage": 5.35, "elapsed_time": "0:03:11", "remaining_time": "0:56:18", "throughput": 6205.99, "total_tokens": 1185384} {"current_steps": 1820, "total_steps": 33920, "loss": 0.6003, "lr": 5.362617924528302e-06, "epoch": 1.0731132075471699, "percentage": 5.37, "elapsed_time": "0:03:11", "remaining_time": "0:56:17", "throughput": 6205.83, "total_tokens": 1188392} {"current_steps": 1825, "total_steps": 33920, "loss": 0.5613, "lr": 5.377358490566038e-06, "epoch": 1.076061320754717, "percentage": 5.38, "elapsed_time": "0:03:12", "remaining_time": "0:56:18", "throughput": 6206.65, "total_tokens": 1192264} {"current_steps": 1830, "total_steps": 33920, "loss": 0.5039, "lr": 5.392099056603775e-06, "epoch": 1.0790094339622642, "percentage": 5.4, "elapsed_time": "0:03:12", "remaining_time": "0:56:17", "throughput": 6206.73, "total_tokens": 1195592} {"current_steps": 1835, "total_steps": 33920, "loss": 0.7268, "lr": 5.40683962264151e-06, "epoch": 1.0819575471698113, "percentage": 5.41, "elapsed_time": "0:03:13", "remaining_time": "0:56:16", "throughput": 6204.74, "total_tokens": 1198216} {"current_steps": 1840, "total_steps": 33920, "loss": 0.491, "lr": 5.4215801886792455e-06, "epoch": 1.0849056603773586, "percentage": 5.42, "elapsed_time": "0:03:13", "remaining_time": "0:56:15", "throughput": 6204.58, "total_tokens": 1201224} {"current_steps": 1845, "total_steps": 33920, "loss": 0.5731, "lr": 5.436320754716982e-06, "epoch": 1.0878537735849056, "percentage": 5.44, "elapsed_time": "0:03:14", "remaining_time": "0:56:14", "throughput": 6204.81, "total_tokens": 1204232} {"current_steps": 1850, "total_steps": 33920, "loss": 0.611, "lr": 5.451061320754717e-06, "epoch": 1.0908018867924527, "percentage": 5.45, "elapsed_time": "0:03:14", "remaining_time": "0:56:13", "throughput": 6205.94, "total_tokens": 1207624} {"current_steps": 1855, "total_steps": 33920, "loss": 0.5949, "lr": 5.465801886792453e-06, "epoch": 1.09375, "percentage": 5.47, "elapsed_time": "0:03:15", "remaining_time": "0:56:12", "throughput": 6205.98, "total_tokens": 1210664} {"current_steps": 1860, "total_steps": 33920, "loss": 0.71, "lr": 5.4805424528301886e-06, "epoch": 1.0966981132075473, "percentage": 5.48, "elapsed_time": "0:03:15", "remaining_time": "0:56:11", "throughput": 6206.26, "total_tokens": 1214024} {"current_steps": 1865, "total_steps": 33920, "loss": 0.3621, "lr": 5.495283018867925e-06, "epoch": 1.0996462264150944, "percentage": 5.5, "elapsed_time": "0:03:16", "remaining_time": "0:56:10", "throughput": 6206.22, "total_tokens": 1217192} {"current_steps": 1870, "total_steps": 33920, "loss": 0.5362, "lr": 5.51002358490566e-06, "epoch": 1.1025943396226414, "percentage": 5.51, "elapsed_time": "0:03:16", "remaining_time": "0:56:09", "throughput": 6205.36, "total_tokens": 1219912} {"current_steps": 1875, "total_steps": 33920, "loss": 0.5, "lr": 5.524764150943397e-06, "epoch": 1.1055424528301887, "percentage": 5.53, "elapsed_time": "0:03:17", "remaining_time": "0:56:07", "throughput": 6203.25, "total_tokens": 1222184} {"current_steps": 1880, "total_steps": 33920, "loss": 0.7646, "lr": 5.5395047169811325e-06, "epoch": 1.1084905660377358, "percentage": 5.54, "elapsed_time": "0:03:17", "remaining_time": "0:56:05", "throughput": 6202.21, "total_tokens": 1224680} {"current_steps": 1885, "total_steps": 33920, "loss": 0.7365, "lr": 5.554245283018869e-06, "epoch": 1.111438679245283, "percentage": 5.56, "elapsed_time": "0:03:17", "remaining_time": "0:56:04", "throughput": 6202.71, "total_tokens": 1228104} {"current_steps": 1890, "total_steps": 33920, "loss": 0.5355, "lr": 5.568985849056604e-06, "epoch": 1.1143867924528301, "percentage": 5.57, "elapsed_time": "0:03:18", "remaining_time": "0:56:04", "throughput": 6203.54, "total_tokens": 1231528} {"current_steps": 1895, "total_steps": 33920, "loss": 0.494, "lr": 5.58372641509434e-06, "epoch": 1.1173349056603774, "percentage": 5.59, "elapsed_time": "0:03:19", "remaining_time": "0:56:03", "throughput": 6203.49, "total_tokens": 1234728} {"current_steps": 1900, "total_steps": 33920, "loss": 0.5302, "lr": 5.5984669811320755e-06, "epoch": 1.1202830188679245, "percentage": 5.6, "elapsed_time": "0:03:19", "remaining_time": "0:56:02", "throughput": 6203.37, "total_tokens": 1237800} {"current_steps": 1905, "total_steps": 33920, "loss": 0.4128, "lr": 5.613207547169813e-06, "epoch": 1.1232311320754718, "percentage": 5.62, "elapsed_time": "0:03:20", "remaining_time": "0:56:01", "throughput": 6202.33, "total_tokens": 1240744} {"current_steps": 1910, "total_steps": 33920, "loss": 0.5518, "lr": 5.627948113207548e-06, "epoch": 1.1261792452830188, "percentage": 5.63, "elapsed_time": "0:03:20", "remaining_time": "0:56:04", "throughput": 6205.04, "total_tokens": 1245608} {"current_steps": 1915, "total_steps": 33920, "loss": 0.4392, "lr": 5.642688679245284e-06, "epoch": 1.1291273584905661, "percentage": 5.65, "elapsed_time": "0:03:21", "remaining_time": "0:56:02", "throughput": 6204.68, "total_tokens": 1248456} {"current_steps": 1920, "total_steps": 33920, "loss": 0.5152, "lr": 5.6574292452830195e-06, "epoch": 1.1320754716981132, "percentage": 5.66, "elapsed_time": "0:03:21", "remaining_time": "0:56:02", "throughput": 6206.34, "total_tokens": 1252232} {"current_steps": 1925, "total_steps": 33920, "loss": 0.5063, "lr": 5.672169811320756e-06, "epoch": 1.1350235849056605, "percentage": 5.68, "elapsed_time": "0:03:22", "remaining_time": "0:56:01", "throughput": 6205.7, "total_tokens": 1255048} {"current_steps": 1930, "total_steps": 33920, "loss": 0.5155, "lr": 5.686910377358491e-06, "epoch": 1.1379716981132075, "percentage": 5.69, "elapsed_time": "0:03:22", "remaining_time": "0:56:01", "throughput": 6206.64, "total_tokens": 1258664} {"current_steps": 1935, "total_steps": 33920, "loss": 0.6073, "lr": 5.701650943396226e-06, "epoch": 1.1409198113207548, "percentage": 5.7, "elapsed_time": "0:03:23", "remaining_time": "0:56:00", "throughput": 6206.2, "total_tokens": 1261576} {"current_steps": 1940, "total_steps": 33920, "loss": 0.4653, "lr": 5.7163915094339625e-06, "epoch": 1.1438679245283019, "percentage": 5.72, "elapsed_time": "0:03:23", "remaining_time": "0:55:58", "throughput": 6205.55, "total_tokens": 1264392} {"current_steps": 1945, "total_steps": 33920, "loss": 0.5307, "lr": 5.731132075471698e-06, "epoch": 1.146816037735849, "percentage": 5.73, "elapsed_time": "0:03:24", "remaining_time": "0:55:58", "throughput": 6205.56, "total_tokens": 1267720} {"current_steps": 1950, "total_steps": 33920, "loss": 0.4903, "lr": 5.745872641509435e-06, "epoch": 1.1497641509433962, "percentage": 5.75, "elapsed_time": "0:03:24", "remaining_time": "0:55:57", "throughput": 6205.3, "total_tokens": 1270600} {"current_steps": 1955, "total_steps": 33920, "loss": 0.7938, "lr": 5.76061320754717e-06, "epoch": 1.1527122641509433, "percentage": 5.76, "elapsed_time": "0:03:25", "remaining_time": "0:55:57", "throughput": 6205.53, "total_tokens": 1274312} {"current_steps": 1960, "total_steps": 33920, "loss": 0.577, "lr": 5.7753537735849065e-06, "epoch": 1.1556603773584906, "percentage": 5.78, "elapsed_time": "0:03:25", "remaining_time": "0:55:57", "throughput": 6206.64, "total_tokens": 1278088} {"current_steps": 1965, "total_steps": 33920, "loss": 0.5244, "lr": 5.790094339622642e-06, "epoch": 1.1586084905660377, "percentage": 5.79, "elapsed_time": "0:03:26", "remaining_time": "0:55:56", "throughput": 6207.07, "total_tokens": 1281160} {"current_steps": 1970, "total_steps": 33920, "loss": 0.5503, "lr": 5.804834905660378e-06, "epoch": 1.161556603773585, "percentage": 5.81, "elapsed_time": "0:03:26", "remaining_time": "0:55:56", "throughput": 6208.09, "total_tokens": 1284840} {"current_steps": 1975, "total_steps": 33920, "loss": 0.5648, "lr": 5.819575471698113e-06, "epoch": 1.164504716981132, "percentage": 5.82, "elapsed_time": "0:03:27", "remaining_time": "0:55:56", "throughput": 6208.62, "total_tokens": 1288232} {"current_steps": 1980, "total_steps": 33920, "loss": 0.6383, "lr": 5.8343160377358495e-06, "epoch": 1.1674528301886793, "percentage": 5.84, "elapsed_time": "0:03:27", "remaining_time": "0:55:55", "throughput": 6209.09, "total_tokens": 1291464} {"current_steps": 1985, "total_steps": 33920, "loss": 0.5669, "lr": 5.849056603773585e-06, "epoch": 1.1704009433962264, "percentage": 5.85, "elapsed_time": "0:03:28", "remaining_time": "0:55:56", "throughput": 6210.29, "total_tokens": 1295496} {"current_steps": 1990, "total_steps": 33920, "loss": 0.5102, "lr": 5.863797169811322e-06, "epoch": 1.1733490566037736, "percentage": 5.87, "elapsed_time": "0:03:29", "remaining_time": "0:55:54", "throughput": 6209.91, "total_tokens": 1298248} {"current_steps": 1995, "total_steps": 33920, "loss": 0.555, "lr": 5.878537735849057e-06, "epoch": 1.1762971698113207, "percentage": 5.88, "elapsed_time": "0:03:29", "remaining_time": "0:55:53", "throughput": 6209.77, "total_tokens": 1301416} {"current_steps": 2000, "total_steps": 33920, "loss": 0.5001, "lr": 5.8932783018867934e-06, "epoch": 1.179245283018868, "percentage": 5.9, "elapsed_time": "0:03:30", "remaining_time": "0:55:52", "throughput": 6209.22, "total_tokens": 1304168} {"current_steps": 2005, "total_steps": 33920, "loss": 0.4784, "lr": 5.908018867924529e-06, "epoch": 1.182193396226415, "percentage": 5.91, "elapsed_time": "0:03:30", "remaining_time": "0:55:57", "throughput": 6210.23, "total_tokens": 1309928} {"current_steps": 2010, "total_steps": 33920, "loss": 0.3776, "lr": 5.922759433962265e-06, "epoch": 1.1851415094339623, "percentage": 5.93, "elapsed_time": "0:03:31", "remaining_time": "0:55:56", "throughput": 6207.98, "total_tokens": 1312424} {"current_steps": 2015, "total_steps": 33920, "loss": 0.6335, "lr": 5.9375e-06, "epoch": 1.1880896226415094, "percentage": 5.94, "elapsed_time": "0:03:31", "remaining_time": "0:55:54", "throughput": 6207.68, "total_tokens": 1315272} {"current_steps": 2020, "total_steps": 33920, "loss": 0.4161, "lr": 5.952240566037736e-06, "epoch": 1.1910377358490567, "percentage": 5.96, "elapsed_time": "0:03:32", "remaining_time": "0:55:54", "throughput": 6208.48, "total_tokens": 1318632} {"current_steps": 2025, "total_steps": 33920, "loss": 0.6086, "lr": 5.966981132075472e-06, "epoch": 1.1939858490566038, "percentage": 5.97, "elapsed_time": "0:03:32", "remaining_time": "0:55:54", "throughput": 6209.76, "total_tokens": 1322504} {"current_steps": 2030, "total_steps": 33920, "loss": 0.6115, "lr": 5.981721698113207e-06, "epoch": 1.196933962264151, "percentage": 5.98, "elapsed_time": "0:03:33", "remaining_time": "0:55:55", "throughput": 6209.53, "total_tokens": 1326184} {"current_steps": 2035, "total_steps": 33920, "loss": 0.5803, "lr": 5.996462264150944e-06, "epoch": 1.1998820754716981, "percentage": 6.0, "elapsed_time": "0:03:34", "remaining_time": "0:55:53", "throughput": 6209.57, "total_tokens": 1329128} {"current_steps": 2040, "total_steps": 33920, "loss": 0.3544, "lr": 6.01120283018868e-06, "epoch": 1.2028301886792452, "percentage": 6.01, "elapsed_time": "0:03:34", "remaining_time": "0:55:57", "throughput": 6211.97, "total_tokens": 1334568} {"current_steps": 2045, "total_steps": 33920, "loss": 0.6456, "lr": 6.025943396226416e-06, "epoch": 1.2057783018867925, "percentage": 6.03, "elapsed_time": "0:03:35", "remaining_time": "0:55:56", "throughput": 6212.95, "total_tokens": 1338024} {"current_steps": 2050, "total_steps": 33920, "loss": 0.401, "lr": 6.040683962264151e-06, "epoch": 1.2087264150943395, "percentage": 6.04, "elapsed_time": "0:03:35", "remaining_time": "0:55:56", "throughput": 6213.75, "total_tokens": 1341672} {"current_steps": 2055, "total_steps": 33920, "loss": 0.5664, "lr": 6.055424528301887e-06, "epoch": 1.2116745283018868, "percentage": 6.06, "elapsed_time": "0:03:36", "remaining_time": "0:55:55", "throughput": 6211.93, "total_tokens": 1344072} {"current_steps": 2060, "total_steps": 33920, "loss": 0.5289, "lr": 6.070165094339623e-06, "epoch": 1.2146226415094339, "percentage": 6.07, "elapsed_time": "0:03:37", "remaining_time": "0:55:57", "throughput": 6214.85, "total_tokens": 1349256} {"current_steps": 2065, "total_steps": 33920, "loss": 0.5231, "lr": 6.08490566037736e-06, "epoch": 1.2175707547169812, "percentage": 6.09, "elapsed_time": "0:03:37", "remaining_time": "0:55:55", "throughput": 6212.27, "total_tokens": 1351464} {"current_steps": 2070, "total_steps": 33920, "loss": 0.6018, "lr": 6.099646226415095e-06, "epoch": 1.2205188679245282, "percentage": 6.1, "elapsed_time": "0:03:38", "remaining_time": "0:55:55", "throughput": 6212.23, "total_tokens": 1354664} {"current_steps": 2075, "total_steps": 33920, "loss": 0.5997, "lr": 6.114386792452831e-06, "epoch": 1.2234669811320755, "percentage": 6.12, "elapsed_time": "0:03:38", "remaining_time": "0:55:56", "throughput": 6213.28, "total_tokens": 1358856} {"current_steps": 2080, "total_steps": 33920, "loss": 0.4314, "lr": 6.129127358490567e-06, "epoch": 1.2264150943396226, "percentage": 6.13, "elapsed_time": "0:03:39", "remaining_time": "0:55:54", "throughput": 6211.74, "total_tokens": 1361320} {"current_steps": 2085, "total_steps": 33920, "loss": 0.6109, "lr": 6.143867924528303e-06, "epoch": 1.2293632075471699, "percentage": 6.15, "elapsed_time": "0:03:39", "remaining_time": "0:55:54", "throughput": 6211.62, "total_tokens": 1364808} {"current_steps": 2090, "total_steps": 33920, "loss": 0.6597, "lr": 6.158608490566038e-06, "epoch": 1.232311320754717, "percentage": 6.16, "elapsed_time": "0:03:40", "remaining_time": "0:55:53", "throughput": 6211.67, "total_tokens": 1367912} {"current_steps": 2095, "total_steps": 33920, "loss": 0.4178, "lr": 6.173349056603774e-06, "epoch": 1.2352594339622642, "percentage": 6.18, "elapsed_time": "0:03:40", "remaining_time": "0:55:53", "throughput": 6211.56, "total_tokens": 1371432} {"current_steps": 2100, "total_steps": 33920, "loss": 0.7139, "lr": 6.18808962264151e-06, "epoch": 1.2382075471698113, "percentage": 6.19, "elapsed_time": "0:03:41", "remaining_time": "0:55:52", "throughput": 6210.17, "total_tokens": 1373928} {"current_steps": 2105, "total_steps": 33920, "loss": 0.5577, "lr": 6.202830188679245e-06, "epoch": 1.2411556603773586, "percentage": 6.21, "elapsed_time": "0:03:41", "remaining_time": "0:55:52", "throughput": 6211.42, "total_tokens": 1377800} {"current_steps": 2110, "total_steps": 33920, "loss": 0.4557, "lr": 6.217570754716982e-06, "epoch": 1.2441037735849056, "percentage": 6.22, "elapsed_time": "0:03:42", "remaining_time": "0:55:52", "throughput": 6211.28, "total_tokens": 1381064} {"current_steps": 2115, "total_steps": 33920, "loss": 0.6226, "lr": 6.232311320754717e-06, "epoch": 1.2470518867924527, "percentage": 6.24, "elapsed_time": "0:03:42", "remaining_time": "0:55:51", "throughput": 6211.47, "total_tokens": 1384232} {"current_steps": 2120, "total_steps": 33920, "loss": 0.518, "lr": 6.2470518867924536e-06, "epoch": 1.25, "percentage": 6.25, "elapsed_time": "0:03:43", "remaining_time": "0:55:50", "throughput": 6211.12, "total_tokens": 1387240} {"current_steps": 2125, "total_steps": 33920, "loss": 0.6236, "lr": 6.261792452830189e-06, "epoch": 1.2529481132075473, "percentage": 6.26, "elapsed_time": "0:03:43", "remaining_time": "0:55:48", "throughput": 6211.41, "total_tokens": 1390248} {"current_steps": 2130, "total_steps": 33920, "loss": 0.4841, "lr": 6.276533018867925e-06, "epoch": 1.2558962264150944, "percentage": 6.28, "elapsed_time": "0:03:44", "remaining_time": "0:55:48", "throughput": 6211.74, "total_tokens": 1393768} {"current_steps": 2135, "total_steps": 33920, "loss": 0.5816, "lr": 6.2912735849056604e-06, "epoch": 1.2588443396226414, "percentage": 6.29, "elapsed_time": "0:03:44", "remaining_time": "0:55:47", "throughput": 6211.7, "total_tokens": 1396808} {"current_steps": 2140, "total_steps": 33920, "loss": 0.5023, "lr": 6.306014150943397e-06, "epoch": 1.2617924528301887, "percentage": 6.31, "elapsed_time": "0:03:45", "remaining_time": "0:55:46", "throughput": 6211.09, "total_tokens": 1399656} {"current_steps": 2145, "total_steps": 33920, "loss": 0.506, "lr": 6.320754716981132e-06, "epoch": 1.2647405660377358, "percentage": 6.32, "elapsed_time": "0:03:45", "remaining_time": "0:55:46", "throughput": 6210.05, "total_tokens": 1402792} {"current_steps": 2150, "total_steps": 33920, "loss": 0.5521, "lr": 6.335495283018869e-06, "epoch": 1.267688679245283, "percentage": 6.34, "elapsed_time": "0:03:46", "remaining_time": "0:55:44", "throughput": 6208.68, "total_tokens": 1405160} {"current_steps": 2155, "total_steps": 33920, "loss": 0.5534, "lr": 6.350235849056604e-06, "epoch": 1.2706367924528301, "percentage": 6.35, "elapsed_time": "0:03:46", "remaining_time": "0:55:45", "throughput": 6209.37, "total_tokens": 1409512} {"current_steps": 2160, "total_steps": 33920, "loss": 0.4787, "lr": 6.3649764150943406e-06, "epoch": 1.2735849056603774, "percentage": 6.37, "elapsed_time": "0:03:47", "remaining_time": "0:55:46", "throughput": 6210.61, "total_tokens": 1413672} {"current_steps": 2165, "total_steps": 33920, "loss": 0.6297, "lr": 6.379716981132076e-06, "epoch": 1.2765330188679245, "percentage": 6.38, "elapsed_time": "0:03:48", "remaining_time": "0:55:46", "throughput": 6211.02, "total_tokens": 1416968} {"current_steps": 2170, "total_steps": 33920, "loss": 0.5866, "lr": 6.394457547169812e-06, "epoch": 1.2794811320754718, "percentage": 6.4, "elapsed_time": "0:03:48", "remaining_time": "0:55:44", "throughput": 6208.29, "total_tokens": 1419208} {"current_steps": 2175, "total_steps": 33920, "loss": 0.5419, "lr": 6.4091981132075474e-06, "epoch": 1.2824292452830188, "percentage": 6.41, "elapsed_time": "0:03:49", "remaining_time": "0:55:45", "throughput": 6207.83, "total_tokens": 1422728} {"current_steps": 2180, "total_steps": 33920, "loss": 0.5076, "lr": 6.423938679245284e-06, "epoch": 1.2853773584905661, "percentage": 6.43, "elapsed_time": "0:03:49", "remaining_time": "0:55:44", "throughput": 6209.38, "total_tokens": 1426568} {"current_steps": 2185, "total_steps": 33920, "loss": 0.6449, "lr": 6.438679245283019e-06, "epoch": 1.2883254716981132, "percentage": 6.44, "elapsed_time": "0:03:50", "remaining_time": "0:55:44", "throughput": 6210.17, "total_tokens": 1430088} {"current_steps": 2190, "total_steps": 33920, "loss": 0.6354, "lr": 6.453419811320756e-06, "epoch": 1.2912735849056602, "percentage": 6.46, "elapsed_time": "0:03:50", "remaining_time": "0:55:42", "throughput": 6208.21, "total_tokens": 1432424} {"current_steps": 2195, "total_steps": 33920, "loss": 0.5598, "lr": 6.468160377358491e-06, "epoch": 1.2942216981132075, "percentage": 6.47, "elapsed_time": "0:03:51", "remaining_time": "0:55:43", "throughput": 6209.6, "total_tokens": 1436488} {"current_steps": 2200, "total_steps": 33920, "loss": 0.4876, "lr": 6.482900943396227e-06, "epoch": 1.2971698113207548, "percentage": 6.49, "elapsed_time": "0:03:51", "remaining_time": "0:55:43", "throughput": 6209.53, "total_tokens": 1439848} {"current_steps": 2205, "total_steps": 33920, "loss": 0.463, "lr": 6.497641509433963e-06, "epoch": 1.3001179245283019, "percentage": 6.5, "elapsed_time": "0:03:52", "remaining_time": "0:55:42", "throughput": 6209.67, "total_tokens": 1443176} {"current_steps": 2210, "total_steps": 33920, "loss": 0.5403, "lr": 6.512382075471698e-06, "epoch": 1.303066037735849, "percentage": 6.52, "elapsed_time": "0:03:53", "remaining_time": "0:55:52", "throughput": 6212.55, "total_tokens": 1451400} {"current_steps": 2215, "total_steps": 33920, "loss": 0.7305, "lr": 6.5271226415094344e-06, "epoch": 1.3060141509433962, "percentage": 6.53, "elapsed_time": "0:03:54", "remaining_time": "0:55:51", "throughput": 6211.62, "total_tokens": 1454280} {"current_steps": 2220, "total_steps": 33920, "loss": 0.5723, "lr": 6.54186320754717e-06, "epoch": 1.3089622641509435, "percentage": 6.54, "elapsed_time": "0:03:54", "remaining_time": "0:55:49", "throughput": 6210.5, "total_tokens": 1456904} {"current_steps": 2225, "total_steps": 33920, "loss": 0.4412, "lr": 6.556603773584907e-06, "epoch": 1.3119103773584906, "percentage": 6.56, "elapsed_time": "0:03:55", "remaining_time": "0:55:49", "throughput": 6211.74, "total_tokens": 1460712} {"current_steps": 2230, "total_steps": 33920, "loss": 0.525, "lr": 6.571344339622641e-06, "epoch": 1.3148584905660377, "percentage": 6.57, "elapsed_time": "0:03:55", "remaining_time": "0:55:50", "throughput": 6212.26, "total_tokens": 1464616} {"current_steps": 2235, "total_steps": 33920, "loss": 0.4586, "lr": 6.586084905660378e-06, "epoch": 1.317806603773585, "percentage": 6.59, "elapsed_time": "0:03:56", "remaining_time": "0:55:50", "throughput": 6213.52, "total_tokens": 1468584} {"current_steps": 2240, "total_steps": 33920, "loss": 0.4612, "lr": 6.600825471698114e-06, "epoch": 1.320754716981132, "percentage": 6.6, "elapsed_time": "0:03:56", "remaining_time": "0:55:50", "throughput": 6214.18, "total_tokens": 1472072} {"current_steps": 2245, "total_steps": 33920, "loss": 0.5793, "lr": 6.61556603773585e-06, "epoch": 1.3237028301886793, "percentage": 6.62, "elapsed_time": "0:03:57", "remaining_time": "0:55:54", "throughput": 6216.54, "total_tokens": 1477928} {"current_steps": 2250, "total_steps": 33920, "loss": 0.5162, "lr": 6.630306603773585e-06, "epoch": 1.3266509433962264, "percentage": 6.63, "elapsed_time": "0:03:58", "remaining_time": "0:55:53", "throughput": 6216.33, "total_tokens": 1481032} {"current_steps": 2255, "total_steps": 33920, "loss": 0.7315, "lr": 6.645047169811321e-06, "epoch": 1.3295990566037736, "percentage": 6.65, "elapsed_time": "0:03:58", "remaining_time": "0:55:52", "throughput": 6216.02, "total_tokens": 1484232} {"current_steps": 2260, "total_steps": 33920, "loss": 0.5708, "lr": 6.659787735849057e-06, "epoch": 1.3325471698113207, "percentage": 6.66, "elapsed_time": "0:03:59", "remaining_time": "0:55:52", "throughput": 6216.51, "total_tokens": 1487592} {"current_steps": 2265, "total_steps": 33920, "loss": 0.4436, "lr": 6.674528301886794e-06, "epoch": 1.335495283018868, "percentage": 6.68, "elapsed_time": "0:03:59", "remaining_time": "0:55:50", "throughput": 6216.37, "total_tokens": 1490344} {"current_steps": 2270, "total_steps": 33920, "loss": 0.3889, "lr": 6.689268867924529e-06, "epoch": 1.338443396226415, "percentage": 6.69, "elapsed_time": "0:04:00", "remaining_time": "0:55:49", "throughput": 6215.89, "total_tokens": 1493288} {"current_steps": 2275, "total_steps": 33920, "loss": 0.608, "lr": 6.704009433962265e-06, "epoch": 1.3413915094339623, "percentage": 6.71, "elapsed_time": "0:04:00", "remaining_time": "0:55:48", "throughput": 6215.18, "total_tokens": 1496008} {"current_steps": 2280, "total_steps": 33920, "loss": 0.6057, "lr": 6.718750000000001e-06, "epoch": 1.3443396226415094, "percentage": 6.72, "elapsed_time": "0:04:01", "remaining_time": "0:55:46", "throughput": 6215.08, "total_tokens": 1498856} {"current_steps": 2285, "total_steps": 33920, "loss": 0.5424, "lr": 6.733490566037736e-06, "epoch": 1.3472877358490565, "percentage": 6.74, "elapsed_time": "0:04:01", "remaining_time": "0:55:45", "throughput": 6214.75, "total_tokens": 1501800} {"current_steps": 2290, "total_steps": 33920, "loss": 0.5354, "lr": 6.748231132075472e-06, "epoch": 1.3502358490566038, "percentage": 6.75, "elapsed_time": "0:04:02", "remaining_time": "0:55:44", "throughput": 6215.18, "total_tokens": 1504872} {"current_steps": 2295, "total_steps": 33920, "loss": 0.5135, "lr": 6.7629716981132076e-06, "epoch": 1.353183962264151, "percentage": 6.77, "elapsed_time": "0:04:02", "remaining_time": "0:55:44", "throughput": 6215.52, "total_tokens": 1508520} {"current_steps": 2300, "total_steps": 33920, "loss": 0.4051, "lr": 6.777712264150944e-06, "epoch": 1.3561320754716981, "percentage": 6.78, "elapsed_time": "0:04:03", "remaining_time": "0:55:43", "throughput": 6215.53, "total_tokens": 1511528} {"current_steps": 2305, "total_steps": 33920, "loss": 0.5546, "lr": 6.792452830188679e-06, "epoch": 1.3590801886792452, "percentage": 6.8, "elapsed_time": "0:04:03", "remaining_time": "0:55:41", "throughput": 6215.42, "total_tokens": 1514376} {"current_steps": 2310, "total_steps": 33920, "loss": 0.4569, "lr": 6.807193396226416e-06, "epoch": 1.3620283018867925, "percentage": 6.81, "elapsed_time": "0:04:04", "remaining_time": "0:55:41", "throughput": 6216.5, "total_tokens": 1517896} {"current_steps": 2315, "total_steps": 33920, "loss": 0.419, "lr": 6.8219339622641515e-06, "epoch": 1.3649764150943398, "percentage": 6.82, "elapsed_time": "0:04:04", "remaining_time": "0:55:40", "throughput": 6217.2, "total_tokens": 1521224} {"current_steps": 2320, "total_steps": 33920, "loss": 0.5165, "lr": 6.836674528301888e-06, "epoch": 1.3679245283018868, "percentage": 6.84, "elapsed_time": "0:04:05", "remaining_time": "0:55:38", "throughput": 6216.29, "total_tokens": 1523848} {"current_steps": 2325, "total_steps": 33920, "loss": 0.3965, "lr": 6.851415094339623e-06, "epoch": 1.3708726415094339, "percentage": 6.85, "elapsed_time": "0:04:05", "remaining_time": "0:55:39", "throughput": 6217.57, "total_tokens": 1527912} {"current_steps": 2330, "total_steps": 33920, "loss": 0.5324, "lr": 6.866155660377359e-06, "epoch": 1.3738207547169812, "percentage": 6.87, "elapsed_time": "0:04:06", "remaining_time": "0:55:38", "throughput": 6217.81, "total_tokens": 1530920} {"current_steps": 2335, "total_steps": 33920, "loss": 0.5339, "lr": 6.8808962264150946e-06, "epoch": 1.3767688679245282, "percentage": 6.88, "elapsed_time": "0:04:06", "remaining_time": "0:55:38", "throughput": 6218.56, "total_tokens": 1534760} {"current_steps": 2340, "total_steps": 33920, "loss": 0.6572, "lr": 6.895636792452831e-06, "epoch": 1.3797169811320755, "percentage": 6.9, "elapsed_time": "0:04:07", "remaining_time": "0:55:39", "throughput": 6219.67, "total_tokens": 1538920} {"current_steps": 2345, "total_steps": 33920, "loss": 0.5419, "lr": 6.910377358490566e-06, "epoch": 1.3826650943396226, "percentage": 6.91, "elapsed_time": "0:04:07", "remaining_time": "0:55:37", "throughput": 6219.87, "total_tokens": 1541928} {"current_steps": 2350, "total_steps": 33920, "loss": 0.6152, "lr": 6.925117924528303e-06, "epoch": 1.3856132075471699, "percentage": 6.93, "elapsed_time": "0:04:08", "remaining_time": "0:55:37", "throughput": 6220.83, "total_tokens": 1545672} {"current_steps": 2355, "total_steps": 33920, "loss": 0.4749, "lr": 6.9398584905660385e-06, "epoch": 1.388561320754717, "percentage": 6.94, "elapsed_time": "0:04:09", "remaining_time": "0:55:37", "throughput": 6221.64, "total_tokens": 1549256} {"current_steps": 2360, "total_steps": 33920, "loss": 0.3977, "lr": 6.954599056603775e-06, "epoch": 1.3915094339622642, "percentage": 6.96, "elapsed_time": "0:04:09", "remaining_time": "0:55:35", "throughput": 6221.33, "total_tokens": 1551912} {"current_steps": 2365, "total_steps": 33920, "loss": 0.6615, "lr": 6.96933962264151e-06, "epoch": 1.3944575471698113, "percentage": 6.97, "elapsed_time": "0:04:10", "remaining_time": "0:55:36", "throughput": 6222.65, "total_tokens": 1555848} {"current_steps": 2370, "total_steps": 33920, "loss": 0.7967, "lr": 6.984080188679245e-06, "epoch": 1.3974056603773586, "percentage": 6.99, "elapsed_time": "0:04:10", "remaining_time": "0:55:35", "throughput": 6223.25, "total_tokens": 1559080} {"current_steps": 2375, "total_steps": 33920, "loss": 0.5446, "lr": 6.9988207547169815e-06, "epoch": 1.4003537735849056, "percentage": 7.0, "elapsed_time": "0:04:11", "remaining_time": "0:55:34", "throughput": 6223.54, "total_tokens": 1562216} {"current_steps": 2380, "total_steps": 33920, "loss": 0.5031, "lr": 7.013561320754717e-06, "epoch": 1.4033018867924527, "percentage": 7.02, "elapsed_time": "0:04:11", "remaining_time": "0:55:34", "throughput": 6225.33, "total_tokens": 1566568} {"current_steps": 2385, "total_steps": 33920, "loss": 0.6425, "lr": 7.028301886792454e-06, "epoch": 1.40625, "percentage": 7.03, "elapsed_time": "0:04:12", "remaining_time": "0:55:33", "throughput": 6225.43, "total_tokens": 1569608} {"current_steps": 2390, "total_steps": 33920, "loss": 0.5996, "lr": 7.043042452830188e-06, "epoch": 1.4091981132075473, "percentage": 7.05, "elapsed_time": "0:04:12", "remaining_time": "0:55:33", "throughput": 6225.8, "total_tokens": 1572968} {"current_steps": 2395, "total_steps": 33920, "loss": 0.6181, "lr": 7.0577830188679255e-06, "epoch": 1.4121462264150944, "percentage": 7.06, "elapsed_time": "0:04:13", "remaining_time": "0:55:31", "throughput": 6225.29, "total_tokens": 1575848} {"current_steps": 2400, "total_steps": 33920, "loss": 0.4485, "lr": 7.072523584905661e-06, "epoch": 1.4150943396226414, "percentage": 7.08, "elapsed_time": "0:04:13", "remaining_time": "0:55:30", "throughput": 6225.96, "total_tokens": 1579048} {"current_steps": 2405, "total_steps": 33920, "loss": 0.6, "lr": 7.087264150943397e-06, "epoch": 1.4180424528301887, "percentage": 7.09, "elapsed_time": "0:04:14", "remaining_time": "0:55:30", "throughput": 6226.64, "total_tokens": 1582408} {"current_steps": 2410, "total_steps": 33920, "loss": 0.4986, "lr": 7.102004716981132e-06, "epoch": 1.4209905660377358, "percentage": 7.1, "elapsed_time": "0:04:14", "remaining_time": "0:55:29", "throughput": 6225.64, "total_tokens": 1585320} {"current_steps": 2415, "total_steps": 33920, "loss": 0.545, "lr": 7.1167452830188685e-06, "epoch": 1.423938679245283, "percentage": 7.12, "elapsed_time": "0:04:15", "remaining_time": "0:55:28", "throughput": 6225.87, "total_tokens": 1588584} {"current_steps": 2420, "total_steps": 33920, "loss": 0.5655, "lr": 7.131485849056604e-06, "epoch": 1.4268867924528301, "percentage": 7.13, "elapsed_time": "0:04:15", "remaining_time": "0:55:27", "throughput": 6225.14, "total_tokens": 1591240} {"current_steps": 2425, "total_steps": 33920, "loss": 0.4412, "lr": 7.146226415094341e-06, "epoch": 1.4298349056603774, "percentage": 7.15, "elapsed_time": "0:04:16", "remaining_time": "0:55:27", "throughput": 6226.38, "total_tokens": 1595048} {"current_steps": 2430, "total_steps": 33920, "loss": 0.5324, "lr": 7.160966981132076e-06, "epoch": 1.4327830188679245, "percentage": 7.16, "elapsed_time": "0:04:16", "remaining_time": "0:55:26", "throughput": 6227.34, "total_tokens": 1598664} {"current_steps": 2435, "total_steps": 33920, "loss": 0.5495, "lr": 7.1757075471698125e-06, "epoch": 1.4357311320754718, "percentage": 7.18, "elapsed_time": "0:04:17", "remaining_time": "0:55:25", "throughput": 6226.6, "total_tokens": 1601288} {"current_steps": 2440, "total_steps": 33920, "loss": 0.5499, "lr": 7.190448113207548e-06, "epoch": 1.4386792452830188, "percentage": 7.19, "elapsed_time": "0:04:17", "remaining_time": "0:55:24", "throughput": 6227.18, "total_tokens": 1604552} {"current_steps": 2445, "total_steps": 33920, "loss": 0.5121, "lr": 7.205188679245284e-06, "epoch": 1.4416273584905661, "percentage": 7.21, "elapsed_time": "0:04:18", "remaining_time": "0:55:23", "throughput": 6228.27, "total_tokens": 1608168} {"current_steps": 2450, "total_steps": 33920, "loss": 0.542, "lr": 7.219929245283019e-06, "epoch": 1.4445754716981132, "percentage": 7.22, "elapsed_time": "0:04:18", "remaining_time": "0:55:22", "throughput": 6228.78, "total_tokens": 1611336} {"current_steps": 2455, "total_steps": 33920, "loss": 0.5779, "lr": 7.2346698113207555e-06, "epoch": 1.4475235849056602, "percentage": 7.24, "elapsed_time": "0:04:19", "remaining_time": "0:55:22", "throughput": 6228.86, "total_tokens": 1614760} {"current_steps": 2460, "total_steps": 33920, "loss": 0.5957, "lr": 7.249410377358491e-06, "epoch": 1.4504716981132075, "percentage": 7.25, "elapsed_time": "0:04:19", "remaining_time": "0:55:22", "throughput": 6229.76, "total_tokens": 1618376} {"current_steps": 2465, "total_steps": 33920, "loss": 0.5047, "lr": 7.264150943396226e-06, "epoch": 1.4534198113207548, "percentage": 7.27, "elapsed_time": "0:04:20", "remaining_time": "0:55:21", "throughput": 6229.19, "total_tokens": 1621256} {"current_steps": 2470, "total_steps": 33920, "loss": 0.4867, "lr": 7.278891509433963e-06, "epoch": 1.4563679245283019, "percentage": 7.28, "elapsed_time": "0:04:20", "remaining_time": "0:55:20", "throughput": 6230.09, "total_tokens": 1624808} {"current_steps": 2475, "total_steps": 33920, "loss": 0.6964, "lr": 7.293632075471699e-06, "epoch": 1.459316037735849, "percentage": 7.3, "elapsed_time": "0:04:21", "remaining_time": "0:55:19", "throughput": 6229.76, "total_tokens": 1627688} {"current_steps": 2480, "total_steps": 33920, "loss": 0.4521, "lr": 7.308372641509435e-06, "epoch": 1.4622641509433962, "percentage": 7.31, "elapsed_time": "0:04:21", "remaining_time": "0:55:18", "throughput": 6228.04, "total_tokens": 1630216} {"current_steps": 2485, "total_steps": 33920, "loss": 0.6018, "lr": 7.32311320754717e-06, "epoch": 1.4652122641509435, "percentage": 7.33, "elapsed_time": "0:04:22", "remaining_time": "0:55:17", "throughput": 6229.05, "total_tokens": 1633800} {"current_steps": 2490, "total_steps": 33920, "loss": 0.4558, "lr": 7.337853773584906e-06, "epoch": 1.4681603773584906, "percentage": 7.34, "elapsed_time": "0:04:22", "remaining_time": "0:55:16", "throughput": 6227.8, "total_tokens": 1636168} {"current_steps": 2495, "total_steps": 33920, "loss": 0.4537, "lr": 7.352594339622642e-06, "epoch": 1.4711084905660377, "percentage": 7.36, "elapsed_time": "0:04:23", "remaining_time": "0:55:14", "throughput": 6227.52, "total_tokens": 1638792} {"current_steps": 2500, "total_steps": 33920, "loss": 0.6826, "lr": 7.367334905660378e-06, "epoch": 1.474056603773585, "percentage": 7.37, "elapsed_time": "0:04:23", "remaining_time": "0:55:13", "throughput": 6227.53, "total_tokens": 1642088} {"current_steps": 2505, "total_steps": 33920, "loss": 0.4919, "lr": 7.382075471698113e-06, "epoch": 1.477004716981132, "percentage": 7.39, "elapsed_time": "0:04:24", "remaining_time": "0:55:12", "throughput": 6227.19, "total_tokens": 1644808} {"current_steps": 2510, "total_steps": 33920, "loss": 0.5272, "lr": 7.39681603773585e-06, "epoch": 1.4799528301886793, "percentage": 7.4, "elapsed_time": "0:04:24", "remaining_time": "0:55:11", "throughput": 6226.53, "total_tokens": 1647496} {"current_steps": 2515, "total_steps": 33920, "loss": 0.4371, "lr": 7.411556603773586e-06, "epoch": 1.4829009433962264, "percentage": 7.41, "elapsed_time": "0:04:25", "remaining_time": "0:55:10", "throughput": 6226.25, "total_tokens": 1650760} {"current_steps": 2520, "total_steps": 33920, "loss": 0.5664, "lr": 7.426297169811322e-06, "epoch": 1.4858490566037736, "percentage": 7.43, "elapsed_time": "0:04:25", "remaining_time": "0:55:10", "throughput": 6225.76, "total_tokens": 1653864} {"current_steps": 2525, "total_steps": 33920, "loss": 0.5064, "lr": 7.441037735849057e-06, "epoch": 1.4887971698113207, "percentage": 7.44, "elapsed_time": "0:04:26", "remaining_time": "0:55:08", "throughput": 6225.5, "total_tokens": 1656616} {"current_steps": 2530, "total_steps": 33920, "loss": 0.54, "lr": 7.455778301886793e-06, "epoch": 1.491745283018868, "percentage": 7.46, "elapsed_time": "0:04:26", "remaining_time": "0:55:07", "throughput": 6225.16, "total_tokens": 1659656} {"current_steps": 2535, "total_steps": 33920, "loss": 0.6386, "lr": 7.470518867924529e-06, "epoch": 1.494693396226415, "percentage": 7.47, "elapsed_time": "0:04:27", "remaining_time": "0:55:07", "throughput": 6225.04, "total_tokens": 1662920} {"current_steps": 2540, "total_steps": 33920, "loss": 0.6062, "lr": 7.485259433962266e-06, "epoch": 1.4976415094339623, "percentage": 7.49, "elapsed_time": "0:04:27", "remaining_time": "0:55:06", "throughput": 6225.92, "total_tokens": 1666472} {"current_steps": 2545, "total_steps": 33920, "loss": 0.4959, "lr": 7.500000000000001e-06, "epoch": 1.5005896226415094, "percentage": 7.5, "elapsed_time": "0:04:28", "remaining_time": "0:55:07", "throughput": 6227.12, "total_tokens": 1670760} {"current_steps": 2550, "total_steps": 33920, "loss": 0.5104, "lr": 7.5147405660377355e-06, "epoch": 1.5035377358490565, "percentage": 7.52, "elapsed_time": "0:04:28", "remaining_time": "0:55:07", "throughput": 6227.66, "total_tokens": 1674120} {"current_steps": 2555, "total_steps": 33920, "loss": 0.4651, "lr": 7.5294811320754726e-06, "epoch": 1.5064858490566038, "percentage": 7.53, "elapsed_time": "0:04:29", "remaining_time": "0:55:07", "throughput": 6228.34, "total_tokens": 1677960} {"current_steps": 2560, "total_steps": 33920, "loss": 0.5482, "lr": 7.544221698113208e-06, "epoch": 1.509433962264151, "percentage": 7.55, "elapsed_time": "0:04:29", "remaining_time": "0:55:06", "throughput": 6229.45, "total_tokens": 1681672} {"current_steps": 2565, "total_steps": 33920, "loss": 0.7174, "lr": 7.558962264150944e-06, "epoch": 1.5123820754716981, "percentage": 7.56, "elapsed_time": "0:04:30", "remaining_time": "0:55:06", "throughput": 6230.12, "total_tokens": 1685160} {"current_steps": 2570, "total_steps": 33920, "loss": 0.4796, "lr": 7.5737028301886795e-06, "epoch": 1.5153301886792452, "percentage": 7.58, "elapsed_time": "0:04:31", "remaining_time": "0:55:06", "throughput": 6231.08, "total_tokens": 1689032} {"current_steps": 2575, "total_steps": 33920, "loss": 0.5485, "lr": 7.588443396226416e-06, "epoch": 1.5182783018867925, "percentage": 7.59, "elapsed_time": "0:04:31", "remaining_time": "0:55:05", "throughput": 6230.25, "total_tokens": 1691816} {"current_steps": 2580, "total_steps": 33920, "loss": 0.6361, "lr": 7.603183962264151e-06, "epoch": 1.5212264150943398, "percentage": 7.61, "elapsed_time": "0:04:32", "remaining_time": "0:55:04", "throughput": 6230.56, "total_tokens": 1695016} {"current_steps": 2585, "total_steps": 33920, "loss": 0.5028, "lr": 7.617924528301888e-06, "epoch": 1.5241745283018868, "percentage": 7.62, "elapsed_time": "0:04:32", "remaining_time": "0:55:03", "throughput": 6229.87, "total_tokens": 1697704} {"current_steps": 2590, "total_steps": 33920, "loss": 0.5944, "lr": 7.632665094339623e-06, "epoch": 1.5271226415094339, "percentage": 7.64, "elapsed_time": "0:04:32", "remaining_time": "0:55:02", "throughput": 6228.5, "total_tokens": 1700232} {"current_steps": 2595, "total_steps": 33920, "loss": 0.5677, "lr": 7.64740566037736e-06, "epoch": 1.5300707547169812, "percentage": 7.65, "elapsed_time": "0:04:33", "remaining_time": "0:55:01", "throughput": 6227.98, "total_tokens": 1703144} {"current_steps": 2600, "total_steps": 33920, "loss": 0.4764, "lr": 7.662146226415095e-06, "epoch": 1.5330188679245285, "percentage": 7.67, "elapsed_time": "0:04:34", "remaining_time": "0:55:00", "throughput": 6228.27, "total_tokens": 1706600} {"current_steps": 2605, "total_steps": 33920, "loss": 0.4812, "lr": 7.676886792452832e-06, "epoch": 1.5359669811320755, "percentage": 7.68, "elapsed_time": "0:04:34", "remaining_time": "0:54:59", "throughput": 6228.68, "total_tokens": 1709864} {"current_steps": 2610, "total_steps": 33920, "loss": 0.6062, "lr": 7.691627358490567e-06, "epoch": 1.5389150943396226, "percentage": 7.69, "elapsed_time": "0:04:34", "remaining_time": "0:54:58", "throughput": 6228.67, "total_tokens": 1712776} {"current_steps": 2615, "total_steps": 33920, "loss": 0.3853, "lr": 7.706367924528303e-06, "epoch": 1.5418632075471699, "percentage": 7.71, "elapsed_time": "0:04:35", "remaining_time": "0:54:57", "throughput": 6228.71, "total_tokens": 1715688} {"current_steps": 2620, "total_steps": 33920, "loss": 0.5598, "lr": 7.721108490566038e-06, "epoch": 1.544811320754717, "percentage": 7.72, "elapsed_time": "0:04:35", "remaining_time": "0:54:56", "throughput": 6228.72, "total_tokens": 1718632} {"current_steps": 2625, "total_steps": 33920, "loss": 0.4801, "lr": 7.735849056603775e-06, "epoch": 1.547759433962264, "percentage": 7.74, "elapsed_time": "0:04:36", "remaining_time": "0:54:55", "throughput": 6228.92, "total_tokens": 1721832} {"current_steps": 2630, "total_steps": 33920, "loss": 0.431, "lr": 7.75058962264151e-06, "epoch": 1.5507075471698113, "percentage": 7.75, "elapsed_time": "0:04:36", "remaining_time": "0:54:54", "throughput": 6228.96, "total_tokens": 1724744} {"current_steps": 2635, "total_steps": 33920, "loss": 0.6774, "lr": 7.765330188679246e-06, "epoch": 1.5536556603773586, "percentage": 7.77, "elapsed_time": "0:04:37", "remaining_time": "0:54:53", "throughput": 6229.27, "total_tokens": 1727848} {"current_steps": 2640, "total_steps": 33920, "loss": 0.3957, "lr": 7.780070754716981e-06, "epoch": 1.5566037735849056, "percentage": 7.78, "elapsed_time": "0:04:37", "remaining_time": "0:54:51", "throughput": 6228.49, "total_tokens": 1730408} {"current_steps": 2645, "total_steps": 33920, "loss": 0.5313, "lr": 7.794811320754716e-06, "epoch": 1.5595518867924527, "percentage": 7.8, "elapsed_time": "0:04:38", "remaining_time": "0:54:50", "throughput": 6226.67, "total_tokens": 1732552} {"current_steps": 2650, "total_steps": 33920, "loss": 0.4426, "lr": 7.809551886792453e-06, "epoch": 1.5625, "percentage": 7.81, "elapsed_time": "0:04:38", "remaining_time": "0:54:48", "throughput": 6226.21, "total_tokens": 1735080} {"current_steps": 2655, "total_steps": 33920, "loss": 0.549, "lr": 7.824292452830189e-06, "epoch": 1.5654481132075473, "percentage": 7.83, "elapsed_time": "0:04:39", "remaining_time": "0:54:46", "throughput": 6225.49, "total_tokens": 1737672} {"current_steps": 2660, "total_steps": 33920, "loss": 0.7074, "lr": 7.839033018867926e-06, "epoch": 1.5683962264150944, "percentage": 7.84, "elapsed_time": "0:04:39", "remaining_time": "0:54:46", "throughput": 6225.83, "total_tokens": 1741352} {"current_steps": 2665, "total_steps": 33920, "loss": 0.5314, "lr": 7.853773584905661e-06, "epoch": 1.5713443396226414, "percentage": 7.86, "elapsed_time": "0:04:40", "remaining_time": "0:54:46", "throughput": 6225.64, "total_tokens": 1744360} {"current_steps": 2670, "total_steps": 33920, "loss": 0.4833, "lr": 7.868514150943397e-06, "epoch": 1.5742924528301887, "percentage": 7.87, "elapsed_time": "0:04:40", "remaining_time": "0:54:45", "throughput": 6226.61, "total_tokens": 1748136} {"current_steps": 2675, "total_steps": 33920, "loss": 0.5651, "lr": 7.883254716981132e-06, "epoch": 1.577240566037736, "percentage": 7.89, "elapsed_time": "0:04:41", "remaining_time": "0:54:45", "throughput": 6227.64, "total_tokens": 1751912} {"current_steps": 2680, "total_steps": 33920, "loss": 0.7078, "lr": 7.897995283018869e-06, "epoch": 1.580188679245283, "percentage": 7.9, "elapsed_time": "0:04:41", "remaining_time": "0:54:45", "throughput": 6228.68, "total_tokens": 1755624} {"current_steps": 2685, "total_steps": 33920, "loss": 0.6381, "lr": 7.912735849056604e-06, "epoch": 1.5831367924528301, "percentage": 7.92, "elapsed_time": "0:04:42", "remaining_time": "0:54:45", "throughput": 6229.57, "total_tokens": 1759272} {"current_steps": 2690, "total_steps": 33920, "loss": 0.3713, "lr": 7.927476415094341e-06, "epoch": 1.5860849056603774, "percentage": 7.93, "elapsed_time": "0:04:42", "remaining_time": "0:54:43", "throughput": 6228.98, "total_tokens": 1761960} {"current_steps": 2695, "total_steps": 33920, "loss": 0.6918, "lr": 7.942216981132077e-06, "epoch": 1.5890330188679245, "percentage": 7.95, "elapsed_time": "0:04:43", "remaining_time": "0:54:42", "throughput": 6228.88, "total_tokens": 1764808} {"current_steps": 2700, "total_steps": 33920, "loss": 0.5839, "lr": 7.956957547169812e-06, "epoch": 1.5919811320754715, "percentage": 7.96, "elapsed_time": "0:04:43", "remaining_time": "0:54:41", "throughput": 6229.33, "total_tokens": 1768104} {"current_steps": 2705, "total_steps": 33920, "loss": 0.6301, "lr": 7.971698113207547e-06, "epoch": 1.5949292452830188, "percentage": 7.97, "elapsed_time": "0:04:44", "remaining_time": "0:54:40", "throughput": 6228.66, "total_tokens": 1770856} {"current_steps": 2710, "total_steps": 33920, "loss": 0.6001, "lr": 7.986438679245284e-06, "epoch": 1.5978773584905661, "percentage": 7.99, "elapsed_time": "0:04:44", "remaining_time": "0:54:40", "throughput": 6229.13, "total_tokens": 1774376} {"current_steps": 2715, "total_steps": 33920, "loss": 0.5317, "lr": 8.00117924528302e-06, "epoch": 1.6008254716981132, "percentage": 8.0, "elapsed_time": "0:04:45", "remaining_time": "0:54:40", "throughput": 6229.95, "total_tokens": 1778408} {"current_steps": 2720, "total_steps": 33920, "loss": 0.5523, "lr": 8.015919811320757e-06, "epoch": 1.6037735849056602, "percentage": 8.02, "elapsed_time": "0:04:46", "remaining_time": "0:54:41", "throughput": 6231.58, "total_tokens": 1782984} {"current_steps": 2725, "total_steps": 33920, "loss": 0.6567, "lr": 8.030660377358492e-06, "epoch": 1.6067216981132075, "percentage": 8.03, "elapsed_time": "0:04:46", "remaining_time": "0:54:41", "throughput": 6231.78, "total_tokens": 1786216} {"current_steps": 2730, "total_steps": 33920, "loss": 0.6095, "lr": 8.045400943396227e-06, "epoch": 1.6096698113207548, "percentage": 8.05, "elapsed_time": "0:04:47", "remaining_time": "0:54:40", "throughput": 6230.45, "total_tokens": 1788872} {"current_steps": 2735, "total_steps": 33920, "loss": 0.453, "lr": 8.060141509433963e-06, "epoch": 1.6126179245283019, "percentage": 8.06, "elapsed_time": "0:04:47", "remaining_time": "0:54:41", "throughput": 6231.67, "total_tokens": 1793288} {"current_steps": 2740, "total_steps": 33920, "loss": 0.6921, "lr": 8.074882075471698e-06, "epoch": 1.615566037735849, "percentage": 8.08, "elapsed_time": "0:04:48", "remaining_time": "0:54:42", "throughput": 6232.6, "total_tokens": 1797800} {"current_steps": 2745, "total_steps": 33920, "loss": 0.5082, "lr": 8.089622641509435e-06, "epoch": 1.6185141509433962, "percentage": 8.09, "elapsed_time": "0:04:48", "remaining_time": "0:54:41", "throughput": 6232.86, "total_tokens": 1800936} {"current_steps": 2750, "total_steps": 33920, "loss": 0.6135, "lr": 8.10436320754717e-06, "epoch": 1.6214622641509435, "percentage": 8.11, "elapsed_time": "0:04:49", "remaining_time": "0:54:40", "throughput": 6232.34, "total_tokens": 1803560} {"current_steps": 2755, "total_steps": 33920, "loss": 0.5156, "lr": 8.119103773584906e-06, "epoch": 1.6244103773584906, "percentage": 8.12, "elapsed_time": "0:04:49", "remaining_time": "0:54:39", "throughput": 6231.38, "total_tokens": 1806280} {"current_steps": 2760, "total_steps": 33920, "loss": 0.6498, "lr": 8.133844339622641e-06, "epoch": 1.6273584905660377, "percentage": 8.14, "elapsed_time": "0:04:50", "remaining_time": "0:54:37", "throughput": 6230.89, "total_tokens": 1808904} {"current_steps": 2765, "total_steps": 33920, "loss": 0.5332, "lr": 8.148584905660378e-06, "epoch": 1.630306603773585, "percentage": 8.15, "elapsed_time": "0:04:50", "remaining_time": "0:54:36", "throughput": 6230.83, "total_tokens": 1811752} {"current_steps": 2770, "total_steps": 33920, "loss": 0.5591, "lr": 8.163325471698114e-06, "epoch": 1.6332547169811322, "percentage": 8.17, "elapsed_time": "0:04:51", "remaining_time": "0:54:36", "throughput": 6232.01, "total_tokens": 1815784} {"current_steps": 2775, "total_steps": 33920, "loss": 0.483, "lr": 8.17806603773585e-06, "epoch": 1.6362028301886793, "percentage": 8.18, "elapsed_time": "0:04:51", "remaining_time": "0:54:35", "throughput": 6231.65, "total_tokens": 1818568} {"current_steps": 2780, "total_steps": 33920, "loss": 0.5385, "lr": 8.192806603773586e-06, "epoch": 1.6391509433962264, "percentage": 8.2, "elapsed_time": "0:04:52", "remaining_time": "0:54:34", "throughput": 6231.13, "total_tokens": 1821288} {"current_steps": 2785, "total_steps": 33920, "loss": 0.4553, "lr": 8.207547169811321e-06, "epoch": 1.6420990566037736, "percentage": 8.21, "elapsed_time": "0:04:52", "remaining_time": "0:54:32", "throughput": 6230.1, "total_tokens": 1823624} {"current_steps": 2790, "total_steps": 33920, "loss": 0.717, "lr": 8.222287735849057e-06, "epoch": 1.6450471698113207, "percentage": 8.23, "elapsed_time": "0:04:53", "remaining_time": "0:54:36", "throughput": 6232.13, "total_tokens": 1830280} {"current_steps": 2795, "total_steps": 33920, "loss": 0.5962, "lr": 8.237028301886794e-06, "epoch": 1.6479952830188678, "percentage": 8.24, "elapsed_time": "0:04:54", "remaining_time": "0:54:37", "throughput": 6232.94, "total_tokens": 1834280} {"current_steps": 2800, "total_steps": 33920, "loss": 0.5397, "lr": 8.251768867924529e-06, "epoch": 1.650943396226415, "percentage": 8.25, "elapsed_time": "0:04:54", "remaining_time": "0:54:37", "throughput": 6233.26, "total_tokens": 1838408} {"current_steps": 2805, "total_steps": 33920, "loss": 0.4121, "lr": 8.266509433962266e-06, "epoch": 1.6538915094339623, "percentage": 8.27, "elapsed_time": "0:04:55", "remaining_time": "0:54:37", "throughput": 6234.4, "total_tokens": 1842280} {"current_steps": 2810, "total_steps": 33920, "loss": 0.5273, "lr": 8.281250000000001e-06, "epoch": 1.6568396226415094, "percentage": 8.28, "elapsed_time": "0:04:56", "remaining_time": "0:54:38", "throughput": 6235.02, "total_tokens": 1846504} {"current_steps": 2815, "total_steps": 33920, "loss": 0.4514, "lr": 8.295990566037737e-06, "epoch": 1.6597877358490565, "percentage": 8.3, "elapsed_time": "0:04:56", "remaining_time": "0:54:38", "throughput": 6235.01, "total_tokens": 1849864} {"current_steps": 2820, "total_steps": 33920, "loss": 0.4724, "lr": 8.310731132075472e-06, "epoch": 1.6627358490566038, "percentage": 8.31, "elapsed_time": "0:04:57", "remaining_time": "0:54:36", "throughput": 6234.96, "total_tokens": 1852648} {"current_steps": 2825, "total_steps": 33920, "loss": 0.4499, "lr": 8.325471698113207e-06, "epoch": 1.665683962264151, "percentage": 8.33, "elapsed_time": "0:04:57", "remaining_time": "0:54:36", "throughput": 6235.16, "total_tokens": 1855784} {"current_steps": 2830, "total_steps": 33920, "loss": 0.5938, "lr": 8.340212264150944e-06, "epoch": 1.6686320754716981, "percentage": 8.34, "elapsed_time": "0:04:58", "remaining_time": "0:54:35", "throughput": 6235.06, "total_tokens": 1858888} {"current_steps": 2835, "total_steps": 33920, "loss": 0.5335, "lr": 8.35495283018868e-06, "epoch": 1.6715801886792452, "percentage": 8.36, "elapsed_time": "0:04:58", "remaining_time": "0:54:33", "throughput": 6234.59, "total_tokens": 1861544} {"current_steps": 2840, "total_steps": 33920, "loss": 0.4885, "lr": 8.369693396226415e-06, "epoch": 1.6745283018867925, "percentage": 8.37, "elapsed_time": "0:04:59", "remaining_time": "0:54:33", "throughput": 6234.63, "total_tokens": 1864712} {"current_steps": 2845, "total_steps": 33920, "loss": 0.4812, "lr": 8.38443396226415e-06, "epoch": 1.6774764150943398, "percentage": 8.39, "elapsed_time": "0:04:59", "remaining_time": "0:54:32", "throughput": 6235.28, "total_tokens": 1868232} {"current_steps": 2850, "total_steps": 33920, "loss": 0.4645, "lr": 8.399174528301888e-06, "epoch": 1.6804245283018868, "percentage": 8.4, "elapsed_time": "0:05:00", "remaining_time": "0:54:32", "throughput": 6236.04, "total_tokens": 1871880} {"current_steps": 2855, "total_steps": 33920, "loss": 0.5878, "lr": 8.413915094339623e-06, "epoch": 1.6833726415094339, "percentage": 8.42, "elapsed_time": "0:05:00", "remaining_time": "0:54:31", "throughput": 6235.91, "total_tokens": 1874856} {"current_steps": 2860, "total_steps": 33920, "loss": 0.5682, "lr": 8.42865566037736e-06, "epoch": 1.6863207547169812, "percentage": 8.43, "elapsed_time": "0:05:01", "remaining_time": "0:54:30", "throughput": 6236.09, "total_tokens": 1878120} {"current_steps": 2865, "total_steps": 33920, "loss": 0.5031, "lr": 8.443396226415095e-06, "epoch": 1.6892688679245285, "percentage": 8.45, "elapsed_time": "0:05:01", "remaining_time": "0:54:29", "throughput": 6235.64, "total_tokens": 1881064} {"current_steps": 2870, "total_steps": 33920, "loss": 0.4777, "lr": 8.45813679245283e-06, "epoch": 1.6922169811320755, "percentage": 8.46, "elapsed_time": "0:05:02", "remaining_time": "0:54:29", "throughput": 6236.19, "total_tokens": 1884808} {"current_steps": 2875, "total_steps": 33920, "loss": 0.4178, "lr": 8.472877358490566e-06, "epoch": 1.6951650943396226, "percentage": 8.48, "elapsed_time": "0:05:02", "remaining_time": "0:54:29", "throughput": 6236.51, "total_tokens": 1888168} {"current_steps": 2880, "total_steps": 33920, "loss": 0.5026, "lr": 8.487617924528303e-06, "epoch": 1.6981132075471699, "percentage": 8.49, "elapsed_time": "0:05:03", "remaining_time": "0:54:27", "throughput": 6235.78, "total_tokens": 1890792} {"current_steps": 2885, "total_steps": 33920, "loss": 0.537, "lr": 8.502358490566038e-06, "epoch": 1.701061320754717, "percentage": 8.51, "elapsed_time": "0:05:03", "remaining_time": "0:54:27", "throughput": 6236.3, "total_tokens": 1894408} {"current_steps": 2890, "total_steps": 33920, "loss": 0.6238, "lr": 8.517099056603775e-06, "epoch": 1.704009433962264, "percentage": 8.52, "elapsed_time": "0:05:04", "remaining_time": "0:54:26", "throughput": 6236.16, "total_tokens": 1897480} {"current_steps": 2895, "total_steps": 33920, "loss": 0.4434, "lr": 8.53183962264151e-06, "epoch": 1.7069575471698113, "percentage": 8.53, "elapsed_time": "0:05:04", "remaining_time": "0:54:26", "throughput": 6236.7, "total_tokens": 1901032} {"current_steps": 2900, "total_steps": 33920, "loss": 0.548, "lr": 8.546580188679246e-06, "epoch": 1.7099056603773586, "percentage": 8.55, "elapsed_time": "0:05:05", "remaining_time": "0:54:25", "throughput": 6236.68, "total_tokens": 1904200} {"current_steps": 2905, "total_steps": 33920, "loss": 0.6487, "lr": 8.561320754716981e-06, "epoch": 1.7128537735849056, "percentage": 8.56, "elapsed_time": "0:05:05", "remaining_time": "0:54:24", "throughput": 6236.4, "total_tokens": 1906984} {"current_steps": 2910, "total_steps": 33920, "loss": 0.5328, "lr": 8.576061320754717e-06, "epoch": 1.7158018867924527, "percentage": 8.58, "elapsed_time": "0:05:06", "remaining_time": "0:54:24", "throughput": 6237.28, "total_tokens": 1910664} {"current_steps": 2915, "total_steps": 33920, "loss": 0.6134, "lr": 8.590801886792454e-06, "epoch": 1.71875, "percentage": 8.59, "elapsed_time": "0:05:06", "remaining_time": "0:54:23", "throughput": 6236.98, "total_tokens": 1913736} {"current_steps": 2920, "total_steps": 33920, "loss": 0.5109, "lr": 8.605542452830189e-06, "epoch": 1.7216981132075473, "percentage": 8.61, "elapsed_time": "0:05:07", "remaining_time": "0:54:22", "throughput": 6236.61, "total_tokens": 1916648} {"current_steps": 2925, "total_steps": 33920, "loss": 0.7577, "lr": 8.620283018867926e-06, "epoch": 1.7246462264150944, "percentage": 8.62, "elapsed_time": "0:05:07", "remaining_time": "0:54:21", "throughput": 6236.24, "total_tokens": 1919272} {"current_steps": 2930, "total_steps": 33920, "loss": 0.5543, "lr": 8.635023584905662e-06, "epoch": 1.7275943396226414, "percentage": 8.64, "elapsed_time": "0:05:08", "remaining_time": "0:54:20", "throughput": 6236.7, "total_tokens": 1922664} {"current_steps": 2935, "total_steps": 33920, "loss": 0.4303, "lr": 8.649764150943397e-06, "epoch": 1.7305424528301887, "percentage": 8.65, "elapsed_time": "0:05:08", "remaining_time": "0:54:19", "throughput": 6235.62, "total_tokens": 1925096} {"current_steps": 2940, "total_steps": 33920, "loss": 0.4655, "lr": 8.664504716981132e-06, "epoch": 1.733490566037736, "percentage": 8.67, "elapsed_time": "0:05:09", "remaining_time": "0:54:18", "throughput": 6235.78, "total_tokens": 1928168} {"current_steps": 2945, "total_steps": 33920, "loss": 0.5053, "lr": 8.67924528301887e-06, "epoch": 1.736438679245283, "percentage": 8.68, "elapsed_time": "0:05:09", "remaining_time": "0:54:19", "throughput": 6237.31, "total_tokens": 1932808} {"current_steps": 2950, "total_steps": 33920, "loss": 0.4913, "lr": 8.693985849056605e-06, "epoch": 1.7393867924528301, "percentage": 8.7, "elapsed_time": "0:05:10", "remaining_time": "0:54:18", "throughput": 6236.69, "total_tokens": 1935624} {"current_steps": 2955, "total_steps": 33920, "loss": 0.4896, "lr": 8.70872641509434e-06, "epoch": 1.7423349056603774, "percentage": 8.71, "elapsed_time": "0:05:10", "remaining_time": "0:54:17", "throughput": 6236.82, "total_tokens": 1938824} {"current_steps": 2960, "total_steps": 33920, "loss": 0.4742, "lr": 8.723466981132075e-06, "epoch": 1.7452830188679245, "percentage": 8.73, "elapsed_time": "0:05:11", "remaining_time": "0:54:16", "throughput": 6236.85, "total_tokens": 1941864} {"current_steps": 2965, "total_steps": 33920, "loss": 0.7312, "lr": 8.738207547169812e-06, "epoch": 1.7482311320754715, "percentage": 8.74, "elapsed_time": "0:05:11", "remaining_time": "0:54:15", "throughput": 6236.56, "total_tokens": 1944840} {"current_steps": 2970, "total_steps": 33920, "loss": 0.3845, "lr": 8.752948113207548e-06, "epoch": 1.7511792452830188, "percentage": 8.76, "elapsed_time": "0:05:12", "remaining_time": "0:54:14", "throughput": 6235.68, "total_tokens": 1947208} {"current_steps": 2975, "total_steps": 33920, "loss": 0.4721, "lr": 8.767688679245285e-06, "epoch": 1.7541273584905661, "percentage": 8.77, "elapsed_time": "0:05:12", "remaining_time": "0:54:12", "throughput": 6235.11, "total_tokens": 1949672} {"current_steps": 2980, "total_steps": 33920, "loss": 0.577, "lr": 8.78242924528302e-06, "epoch": 1.7570754716981132, "percentage": 8.79, "elapsed_time": "0:05:13", "remaining_time": "0:54:11", "throughput": 6235.11, "total_tokens": 1952616} {"current_steps": 2985, "total_steps": 33920, "loss": 0.5033, "lr": 8.797169811320755e-06, "epoch": 1.7600235849056602, "percentage": 8.8, "elapsed_time": "0:05:13", "remaining_time": "0:54:10", "throughput": 6233.96, "total_tokens": 1955016} {"current_steps": 2990, "total_steps": 33920, "loss": 0.5216, "lr": 8.81191037735849e-06, "epoch": 1.7629716981132075, "percentage": 8.81, "elapsed_time": "0:05:14", "remaining_time": "0:54:09", "throughput": 6233.53, "total_tokens": 1958088} {"current_steps": 2995, "total_steps": 33920, "loss": 0.4932, "lr": 8.826650943396226e-06, "epoch": 1.7659198113207548, "percentage": 8.83, "elapsed_time": "0:05:14", "remaining_time": "0:54:08", "throughput": 6233.12, "total_tokens": 1960712} {"current_steps": 3000, "total_steps": 33920, "loss": 0.6008, "lr": 8.841391509433963e-06, "epoch": 1.7688679245283019, "percentage": 8.84, "elapsed_time": "0:05:15", "remaining_time": "0:54:07", "throughput": 6233.87, "total_tokens": 1964488} {"current_steps": 3005, "total_steps": 33920, "loss": 0.5004, "lr": 8.856132075471698e-06, "epoch": 1.771816037735849, "percentage": 8.86, "elapsed_time": "0:05:15", "remaining_time": "0:54:07", "throughput": 6232.87, "total_tokens": 1967304} {"current_steps": 3010, "total_steps": 33920, "loss": 0.444, "lr": 8.870872641509435e-06, "epoch": 1.7747641509433962, "percentage": 8.87, "elapsed_time": "0:05:16", "remaining_time": "0:54:06", "throughput": 6233.35, "total_tokens": 1970888} {"current_steps": 3015, "total_steps": 33920, "loss": 0.6787, "lr": 8.88561320754717e-06, "epoch": 1.7777122641509435, "percentage": 8.89, "elapsed_time": "0:05:16", "remaining_time": "0:54:06", "throughput": 6233.91, "total_tokens": 1974568} {"current_steps": 3020, "total_steps": 33920, "loss": 0.5124, "lr": 8.900353773584906e-06, "epoch": 1.7806603773584906, "percentage": 8.9, "elapsed_time": "0:05:17", "remaining_time": "0:54:05", "throughput": 6233.01, "total_tokens": 1977384} {"current_steps": 3025, "total_steps": 33920, "loss": 0.5914, "lr": 8.915094339622642e-06, "epoch": 1.7836084905660377, "percentage": 8.92, "elapsed_time": "0:05:17", "remaining_time": "0:54:05", "throughput": 6233.15, "total_tokens": 1980712} {"current_steps": 3030, "total_steps": 33920, "loss": 0.4686, "lr": 8.929834905660379e-06, "epoch": 1.786556603773585, "percentage": 8.93, "elapsed_time": "0:05:18", "remaining_time": "0:54:04", "throughput": 6232.72, "total_tokens": 1983496} {"current_steps": 3035, "total_steps": 33920, "loss": 0.4699, "lr": 8.944575471698114e-06, "epoch": 1.7895047169811322, "percentage": 8.95, "elapsed_time": "0:05:18", "remaining_time": "0:54:03", "throughput": 6232.2, "total_tokens": 1986632} {"current_steps": 3040, "total_steps": 33920, "loss": 0.3655, "lr": 8.959316037735851e-06, "epoch": 1.7924528301886793, "percentage": 8.96, "elapsed_time": "0:05:19", "remaining_time": "0:54:04", "throughput": 6233.2, "total_tokens": 1990664} {"current_steps": 3045, "total_steps": 33920, "loss": 0.5044, "lr": 8.974056603773586e-06, "epoch": 1.7954009433962264, "percentage": 8.98, "elapsed_time": "0:05:19", "remaining_time": "0:54:03", "throughput": 6232.95, "total_tokens": 1993608} {"current_steps": 3050, "total_steps": 33920, "loss": 0.492, "lr": 8.988797169811322e-06, "epoch": 1.7983490566037736, "percentage": 8.99, "elapsed_time": "0:05:20", "remaining_time": "0:54:02", "throughput": 6233.63, "total_tokens": 1997192} {"current_steps": 3055, "total_steps": 33920, "loss": 0.5813, "lr": 9.003537735849057e-06, "epoch": 1.8012971698113207, "percentage": 9.01, "elapsed_time": "0:05:20", "remaining_time": "0:54:02", "throughput": 6234.72, "total_tokens": 2001224} {"current_steps": 3060, "total_steps": 33920, "loss": 0.5031, "lr": 9.018278301886794e-06, "epoch": 1.8042452830188678, "percentage": 9.02, "elapsed_time": "0:05:21", "remaining_time": "0:54:01", "throughput": 6234.07, "total_tokens": 2003848} {"current_steps": 3065, "total_steps": 33920, "loss": 0.6091, "lr": 9.03301886792453e-06, "epoch": 1.807193396226415, "percentage": 9.04, "elapsed_time": "0:05:21", "remaining_time": "0:54:00", "throughput": 6233.62, "total_tokens": 2006536} {"current_steps": 3070, "total_steps": 33920, "loss": 0.5772, "lr": 9.047759433962265e-06, "epoch": 1.8101415094339623, "percentage": 9.05, "elapsed_time": "0:05:22", "remaining_time": "0:54:00", "throughput": 6234.45, "total_tokens": 2010472} {"current_steps": 3075, "total_steps": 33920, "loss": 0.457, "lr": 9.0625e-06, "epoch": 1.8130896226415094, "percentage": 9.07, "elapsed_time": "0:05:22", "remaining_time": "0:53:59", "throughput": 6234.74, "total_tokens": 2013672} {"current_steps": 3080, "total_steps": 33920, "loss": 0.7132, "lr": 9.077240566037735e-06, "epoch": 1.8160377358490565, "percentage": 9.08, "elapsed_time": "0:05:23", "remaining_time": "0:53:58", "throughput": 6233.62, "total_tokens": 2016232} {"current_steps": 3085, "total_steps": 33920, "loss": 0.5605, "lr": 9.091981132075472e-06, "epoch": 1.8189858490566038, "percentage": 9.09, "elapsed_time": "0:05:23", "remaining_time": "0:53:57", "throughput": 6233.42, "total_tokens": 2019080} {"current_steps": 3090, "total_steps": 33920, "loss": 0.5342, "lr": 9.106721698113208e-06, "epoch": 1.821933962264151, "percentage": 9.11, "elapsed_time": "0:05:24", "remaining_time": "0:53:56", "throughput": 6233.24, "total_tokens": 2021928} {"current_steps": 3095, "total_steps": 33920, "loss": 0.569, "lr": 9.121462264150945e-06, "epoch": 1.8248820754716981, "percentage": 9.12, "elapsed_time": "0:05:24", "remaining_time": "0:53:55", "throughput": 6232.73, "total_tokens": 2024584} {"current_steps": 3100, "total_steps": 33920, "loss": 0.5409, "lr": 9.13620283018868e-06, "epoch": 1.8278301886792452, "percentage": 9.14, "elapsed_time": "0:05:25", "remaining_time": "0:53:54", "throughput": 6233.29, "total_tokens": 2028072} {"current_steps": 3105, "total_steps": 33920, "loss": 0.4276, "lr": 9.150943396226416e-06, "epoch": 1.8307783018867925, "percentage": 9.15, "elapsed_time": "0:05:25", "remaining_time": "0:53:54", "throughput": 6232.33, "total_tokens": 2031048} {"current_steps": 3110, "total_steps": 33920, "loss": 0.4951, "lr": 9.165683962264151e-06, "epoch": 1.8337264150943398, "percentage": 9.17, "elapsed_time": "0:05:26", "remaining_time": "0:53:53", "throughput": 6231.81, "total_tokens": 2033896} {"current_steps": 3115, "total_steps": 33920, "loss": 0.5943, "lr": 9.180424528301888e-06, "epoch": 1.8366745283018868, "percentage": 9.18, "elapsed_time": "0:05:26", "remaining_time": "0:53:52", "throughput": 6230.39, "total_tokens": 2036232} {"current_steps": 3120, "total_steps": 33920, "loss": 0.5577, "lr": 9.195165094339623e-06, "epoch": 1.8396226415094339, "percentage": 9.2, "elapsed_time": "0:05:27", "remaining_time": "0:53:51", "throughput": 6230.0, "total_tokens": 2039208} {"current_steps": 3125, "total_steps": 33920, "loss": 0.3829, "lr": 9.20990566037736e-06, "epoch": 1.8425707547169812, "percentage": 9.21, "elapsed_time": "0:05:27", "remaining_time": "0:53:50", "throughput": 6229.88, "total_tokens": 2041992} {"current_steps": 3130, "total_steps": 33920, "loss": 0.4404, "lr": 9.224646226415096e-06, "epoch": 1.8455188679245285, "percentage": 9.23, "elapsed_time": "0:05:28", "remaining_time": "0:53:49", "throughput": 6229.92, "total_tokens": 2045480} {"current_steps": 3135, "total_steps": 33920, "loss": 0.4147, "lr": 9.239386792452831e-06, "epoch": 1.8484669811320755, "percentage": 9.24, "elapsed_time": "0:05:28", "remaining_time": "0:53:49", "throughput": 6230.6, "total_tokens": 2049224} {"current_steps": 3140, "total_steps": 33920, "loss": 0.7019, "lr": 9.254127358490566e-06, "epoch": 1.8514150943396226, "percentage": 9.26, "elapsed_time": "0:05:29", "remaining_time": "0:53:49", "throughput": 6231.23, "total_tokens": 2052680} {"current_steps": 3145, "total_steps": 33920, "loss": 0.4869, "lr": 9.268867924528303e-06, "epoch": 1.8543632075471699, "percentage": 9.27, "elapsed_time": "0:05:29", "remaining_time": "0:53:48", "throughput": 6231.5, "total_tokens": 2055912} {"current_steps": 3150, "total_steps": 33920, "loss": 0.5925, "lr": 9.283608490566039e-06, "epoch": 1.857311320754717, "percentage": 9.29, "elapsed_time": "0:05:30", "remaining_time": "0:53:48", "throughput": 6232.21, "total_tokens": 2059496} {"current_steps": 3155, "total_steps": 33920, "loss": 0.5065, "lr": 9.298349056603774e-06, "epoch": 1.860259433962264, "percentage": 9.3, "elapsed_time": "0:05:30", "remaining_time": "0:53:47", "throughput": 6232.3, "total_tokens": 2062600} {"current_steps": 3160, "total_steps": 33920, "loss": 0.4166, "lr": 9.31308962264151e-06, "epoch": 1.8632075471698113, "percentage": 9.32, "elapsed_time": "0:05:31", "remaining_time": "0:53:46", "throughput": 6232.22, "total_tokens": 2065704} {"current_steps": 3165, "total_steps": 33920, "loss": 0.4984, "lr": 9.327830188679245e-06, "epoch": 1.8661556603773586, "percentage": 9.33, "elapsed_time": "0:05:31", "remaining_time": "0:53:45", "throughput": 6230.91, "total_tokens": 2068104} {"current_steps": 3170, "total_steps": 33920, "loss": 0.6733, "lr": 9.342570754716982e-06, "epoch": 1.8691037735849056, "percentage": 9.35, "elapsed_time": "0:05:32", "remaining_time": "0:53:44", "throughput": 6230.87, "total_tokens": 2071240} {"current_steps": 3175, "total_steps": 33920, "loss": 0.4775, "lr": 9.357311320754717e-06, "epoch": 1.8720518867924527, "percentage": 9.36, "elapsed_time": "0:05:33", "remaining_time": "0:53:46", "throughput": 6232.52, "total_tokens": 2076456} {"current_steps": 3180, "total_steps": 33920, "loss": 0.4993, "lr": 9.372051886792454e-06, "epoch": 1.875, "percentage": 9.38, "elapsed_time": "0:05:33", "remaining_time": "0:53:45", "throughput": 6232.95, "total_tokens": 2079720} {"current_steps": 3185, "total_steps": 33920, "loss": 0.7159, "lr": 9.38679245283019e-06, "epoch": 1.8779481132075473, "percentage": 9.39, "elapsed_time": "0:05:34", "remaining_time": "0:53:45", "throughput": 6233.41, "total_tokens": 2083528} {"current_steps": 3190, "total_steps": 33920, "loss": 0.5269, "lr": 9.401533018867925e-06, "epoch": 1.8808962264150944, "percentage": 9.4, "elapsed_time": "0:05:34", "remaining_time": "0:53:45", "throughput": 6234.21, "total_tokens": 2087400} {"current_steps": 3195, "total_steps": 33920, "loss": 0.4166, "lr": 9.41627358490566e-06, "epoch": 1.8838443396226414, "percentage": 9.42, "elapsed_time": "0:05:35", "remaining_time": "0:53:45", "throughput": 6234.69, "total_tokens": 2091176} {"current_steps": 3200, "total_steps": 33920, "loss": 0.4323, "lr": 9.431014150943397e-06, "epoch": 1.8867924528301887, "percentage": 9.43, "elapsed_time": "0:05:35", "remaining_time": "0:53:44", "throughput": 6234.28, "total_tokens": 2093928} {"current_steps": 3205, "total_steps": 33920, "loss": 0.4202, "lr": 9.445754716981133e-06, "epoch": 1.889740566037736, "percentage": 9.45, "elapsed_time": "0:05:36", "remaining_time": "0:53:44", "throughput": 6235.04, "total_tokens": 2097992} {"current_steps": 3210, "total_steps": 33920, "loss": 0.5423, "lr": 9.46049528301887e-06, "epoch": 1.892688679245283, "percentage": 9.46, "elapsed_time": "0:05:37", "remaining_time": "0:53:44", "throughput": 6235.1, "total_tokens": 2101256} {"current_steps": 3215, "total_steps": 33920, "loss": 0.4868, "lr": 9.475235849056605e-06, "epoch": 1.8956367924528301, "percentage": 9.48, "elapsed_time": "0:05:37", "remaining_time": "0:53:43", "throughput": 6235.11, "total_tokens": 2104488} {"current_steps": 3220, "total_steps": 33920, "loss": 0.475, "lr": 9.48997641509434e-06, "epoch": 1.8985849056603774, "percentage": 9.49, "elapsed_time": "0:05:38", "remaining_time": "0:53:42", "throughput": 6234.39, "total_tokens": 2107464} {"current_steps": 3225, "total_steps": 33920, "loss": 0.7006, "lr": 9.504716981132076e-06, "epoch": 1.9015330188679245, "percentage": 9.51, "elapsed_time": "0:05:38", "remaining_time": "0:53:41", "throughput": 6234.07, "total_tokens": 2110280} {"current_steps": 3230, "total_steps": 33920, "loss": 0.5718, "lr": 9.519457547169813e-06, "epoch": 1.9044811320754715, "percentage": 9.52, "elapsed_time": "0:05:39", "remaining_time": "0:53:41", "throughput": 6234.09, "total_tokens": 2113384} {"current_steps": 3235, "total_steps": 33920, "loss": 0.5183, "lr": 9.534198113207548e-06, "epoch": 1.9074292452830188, "percentage": 9.54, "elapsed_time": "0:05:39", "remaining_time": "0:53:40", "throughput": 6234.41, "total_tokens": 2116520} {"current_steps": 3240, "total_steps": 33920, "loss": 0.5145, "lr": 9.548938679245285e-06, "epoch": 1.9103773584905661, "percentage": 9.55, "elapsed_time": "0:05:39", "remaining_time": "0:53:39", "throughput": 6234.6, "total_tokens": 2119528} {"current_steps": 3245, "total_steps": 33920, "loss": 0.4883, "lr": 9.56367924528302e-06, "epoch": 1.9133254716981132, "percentage": 9.57, "elapsed_time": "0:05:40", "remaining_time": "0:53:38", "throughput": 6234.13, "total_tokens": 2122440} {"current_steps": 3250, "total_steps": 33920, "loss": 0.5062, "lr": 9.578419811320756e-06, "epoch": 1.9162735849056602, "percentage": 9.58, "elapsed_time": "0:05:40", "remaining_time": "0:53:37", "throughput": 6234.12, "total_tokens": 2125352} {"current_steps": 3255, "total_steps": 33920, "loss": 0.5346, "lr": 9.593160377358491e-06, "epoch": 1.9192216981132075, "percentage": 9.6, "elapsed_time": "0:05:41", "remaining_time": "0:53:36", "throughput": 6234.11, "total_tokens": 2128680} {"current_steps": 3260, "total_steps": 33920, "loss": 0.3889, "lr": 9.607900943396226e-06, "epoch": 1.9221698113207548, "percentage": 9.61, "elapsed_time": "0:05:41", "remaining_time": "0:53:36", "throughput": 6234.3, "total_tokens": 2132040} {"current_steps": 3265, "total_steps": 33920, "loss": 0.4944, "lr": 9.622641509433963e-06, "epoch": 1.9251179245283019, "percentage": 9.63, "elapsed_time": "0:05:42", "remaining_time": "0:53:36", "throughput": 6234.67, "total_tokens": 2135592} {"current_steps": 3270, "total_steps": 33920, "loss": 0.5111, "lr": 9.637382075471699e-06, "epoch": 1.928066037735849, "percentage": 9.64, "elapsed_time": "0:05:43", "remaining_time": "0:53:35", "throughput": 6234.05, "total_tokens": 2138312} {"current_steps": 3275, "total_steps": 33920, "loss": 0.5849, "lr": 9.652122641509434e-06, "epoch": 1.9310141509433962, "percentage": 9.66, "elapsed_time": "0:05:43", "remaining_time": "0:53:34", "throughput": 6233.92, "total_tokens": 2141512} {"current_steps": 3280, "total_steps": 33920, "loss": 0.4269, "lr": 9.66686320754717e-06, "epoch": 1.9339622641509435, "percentage": 9.67, "elapsed_time": "0:05:43", "remaining_time": "0:53:33", "throughput": 6231.89, "total_tokens": 2143528} {"current_steps": 3285, "total_steps": 33920, "loss": 0.5524, "lr": 9.681603773584907e-06, "epoch": 1.9369103773584906, "percentage": 9.68, "elapsed_time": "0:05:44", "remaining_time": "0:53:33", "throughput": 6232.65, "total_tokens": 2147432} {"current_steps": 3290, "total_steps": 33920, "loss": 0.5061, "lr": 9.696344339622642e-06, "epoch": 1.9398584905660377, "percentage": 9.7, "elapsed_time": "0:05:45", "remaining_time": "0:53:31", "throughput": 6231.93, "total_tokens": 2150024} {"current_steps": 3295, "total_steps": 33920, "loss": 0.4664, "lr": 9.711084905660379e-06, "epoch": 1.942806603773585, "percentage": 9.71, "elapsed_time": "0:05:45", "remaining_time": "0:53:31", "throughput": 6232.17, "total_tokens": 2153160} {"current_steps": 3300, "total_steps": 33920, "loss": 0.5878, "lr": 9.725825471698114e-06, "epoch": 1.9457547169811322, "percentage": 9.73, "elapsed_time": "0:05:45", "remaining_time": "0:53:30", "throughput": 6231.79, "total_tokens": 2155944} {"current_steps": 3305, "total_steps": 33920, "loss": 0.5118, "lr": 9.74056603773585e-06, "epoch": 1.9487028301886793, "percentage": 9.74, "elapsed_time": "0:05:46", "remaining_time": "0:53:30", "throughput": 6232.96, "total_tokens": 2160360} {"current_steps": 3310, "total_steps": 33920, "loss": 0.5316, "lr": 9.755306603773585e-06, "epoch": 1.9516509433962264, "percentage": 9.76, "elapsed_time": "0:05:47", "remaining_time": "0:53:29", "throughput": 6232.26, "total_tokens": 2163080} {"current_steps": 3315, "total_steps": 33920, "loss": 0.4617, "lr": 9.770047169811322e-06, "epoch": 1.9545990566037736, "percentage": 9.77, "elapsed_time": "0:05:47", "remaining_time": "0:53:29", "throughput": 6233.24, "total_tokens": 2167176} {"current_steps": 3320, "total_steps": 33920, "loss": 0.5588, "lr": 9.784787735849057e-06, "epoch": 1.9575471698113207, "percentage": 9.79, "elapsed_time": "0:05:48", "remaining_time": "0:53:28", "throughput": 6232.61, "total_tokens": 2169928} {"current_steps": 3325, "total_steps": 33920, "loss": 0.7276, "lr": 9.799528301886794e-06, "epoch": 1.9604952830188678, "percentage": 9.8, "elapsed_time": "0:05:48", "remaining_time": "0:53:28", "throughput": 6232.38, "total_tokens": 2172872} {"current_steps": 3330, "total_steps": 33920, "loss": 0.5249, "lr": 9.81426886792453e-06, "epoch": 1.963443396226415, "percentage": 9.82, "elapsed_time": "0:05:49", "remaining_time": "0:53:27", "throughput": 6231.96, "total_tokens": 2175752} {"current_steps": 3335, "total_steps": 33920, "loss": 0.5895, "lr": 9.829009433962265e-06, "epoch": 1.9663915094339623, "percentage": 9.83, "elapsed_time": "0:05:49", "remaining_time": "0:53:27", "throughput": 6232.41, "total_tokens": 2179528} {"current_steps": 3340, "total_steps": 33920, "loss": 0.4641, "lr": 9.84375e-06, "epoch": 1.9693396226415094, "percentage": 9.85, "elapsed_time": "0:05:50", "remaining_time": "0:53:26", "throughput": 6232.2, "total_tokens": 2182824} {"current_steps": 3345, "total_steps": 33920, "loss": 0.5313, "lr": 9.858490566037736e-06, "epoch": 1.9722877358490565, "percentage": 9.86, "elapsed_time": "0:05:50", "remaining_time": "0:53:25", "throughput": 6232.34, "total_tokens": 2185960} {"current_steps": 3350, "total_steps": 33920, "loss": 0.4859, "lr": 9.873231132075473e-06, "epoch": 1.9752358490566038, "percentage": 9.88, "elapsed_time": "0:05:51", "remaining_time": "0:53:25", "throughput": 6232.52, "total_tokens": 2189512} {"current_steps": 3355, "total_steps": 33920, "loss": 0.6377, "lr": 9.887971698113208e-06, "epoch": 1.978183962264151, "percentage": 9.89, "elapsed_time": "0:05:51", "remaining_time": "0:53:26", "throughput": 6231.73, "total_tokens": 2193064} {"current_steps": 3360, "total_steps": 33920, "loss": 0.5751, "lr": 9.902712264150945e-06, "epoch": 1.9811320754716981, "percentage": 9.91, "elapsed_time": "0:05:52", "remaining_time": "0:53:24", "throughput": 6230.88, "total_tokens": 2195560} {"current_steps": 3365, "total_steps": 33920, "loss": 0.6579, "lr": 9.917452830188679e-06, "epoch": 1.9840801886792452, "percentage": 9.92, "elapsed_time": "0:05:53", "remaining_time": "0:53:26", "throughput": 6232.25, "total_tokens": 2200616} {"current_steps": 3370, "total_steps": 33920, "loss": 0.6471, "lr": 9.932193396226416e-06, "epoch": 1.9870283018867925, "percentage": 9.94, "elapsed_time": "0:05:53", "remaining_time": "0:53:25", "throughput": 6232.45, "total_tokens": 2203880} {"current_steps": 3375, "total_steps": 33920, "loss": 0.5257, "lr": 9.946933962264151e-06, "epoch": 1.9899764150943398, "percentage": 9.95, "elapsed_time": "0:05:54", "remaining_time": "0:53:24", "throughput": 6231.87, "total_tokens": 2206664} {"current_steps": 3380, "total_steps": 33920, "loss": 0.5255, "lr": 9.961674528301888e-06, "epoch": 1.9929245283018868, "percentage": 9.96, "elapsed_time": "0:05:54", "remaining_time": "0:53:23", "throughput": 6230.36, "total_tokens": 2208808} {"current_steps": 3385, "total_steps": 33920, "loss": 0.6001, "lr": 9.976415094339624e-06, "epoch": 1.9958726415094339, "percentage": 9.98, "elapsed_time": "0:05:55", "remaining_time": "0:53:22", "throughput": 6230.44, "total_tokens": 2212200} {"current_steps": 3390, "total_steps": 33920, "loss": 0.6065, "lr": 9.991155660377359e-06, "epoch": 1.9988207547169812, "percentage": 9.99, "elapsed_time": "0:05:55", "remaining_time": "0:53:22", "throughput": 6230.63, "total_tokens": 2215656} {"current_steps": 3392, "total_steps": 33920, "eval_loss": 0.5241208672523499, "epoch": 2.0, "percentage": 10.0, "elapsed_time": "0:06:14", "remaining_time": "0:56:14", "throughput": 5911.52, "total_tokens": 2216560} {"current_steps": 3395, "total_steps": 33920, "loss": 0.4593, "lr": 9.999999894098275e-06, "epoch": 2.0017688679245285, "percentage": 10.01, "elapsed_time": "0:06:18", "remaining_time": "0:56:43", "throughput": 5860.47, "total_tokens": 2218416} {"current_steps": 3400, "total_steps": 33920, "loss": 0.4976, "lr": 9.99999870270391e-06, "epoch": 2.0047169811320753, "percentage": 10.02, "elapsed_time": "0:06:19", "remaining_time": "0:56:43", "throughput": 5860.85, "total_tokens": 2222480} {"current_steps": 3405, "total_steps": 33920, "loss": 0.4705, "lr": 9.999996187538341e-06, "epoch": 2.0076650943396226, "percentage": 10.04, "elapsed_time": "0:06:19", "remaining_time": "0:56:43", "throughput": 5858.83, "total_tokens": 2224752} {"current_steps": 3410, "total_steps": 33920, "loss": 0.4812, "lr": 9.999992348602233e-06, "epoch": 2.01061320754717, "percentage": 10.05, "elapsed_time": "0:06:20", "remaining_time": "0:56:41", "throughput": 5857.59, "total_tokens": 2227216} {"current_steps": 3415, "total_steps": 33920, "loss": 0.6215, "lr": 9.999987185896598e-06, "epoch": 2.013561320754717, "percentage": 10.07, "elapsed_time": "0:06:20", "remaining_time": "0:56:41", "throughput": 5857.21, "total_tokens": 2230224} {"current_steps": 3420, "total_steps": 33920, "loss": 0.5158, "lr": 9.99998069942281e-06, "epoch": 2.016509433962264, "percentage": 10.08, "elapsed_time": "0:06:21", "remaining_time": "0:56:41", "throughput": 5858.64, "total_tokens": 2234288} {"current_steps": 3425, "total_steps": 33920, "loss": 0.5134, "lr": 9.999972889182583e-06, "epoch": 2.0194575471698113, "percentage": 10.1, "elapsed_time": "0:06:21", "remaining_time": "0:56:40", "throughput": 5860.05, "total_tokens": 2238224} {"current_steps": 3430, "total_steps": 33920, "loss": 0.6871, "lr": 9.999963755177984e-06, "epoch": 2.0224056603773586, "percentage": 10.11, "elapsed_time": "0:06:22", "remaining_time": "0:56:39", "throughput": 5859.27, "total_tokens": 2240624} {"current_steps": 3435, "total_steps": 33920, "loss": 0.6166, "lr": 9.999953297411434e-06, "epoch": 2.025353773584906, "percentage": 10.13, "elapsed_time": "0:06:22", "remaining_time": "0:56:38", "throughput": 5859.18, "total_tokens": 2243504} {"current_steps": 3440, "total_steps": 33920, "loss": 0.5816, "lr": 9.999941515885699e-06, "epoch": 2.0283018867924527, "percentage": 10.14, "elapsed_time": "0:06:23", "remaining_time": "0:56:38", "throughput": 5860.07, "total_tokens": 2247600} {"current_steps": 3445, "total_steps": 33920, "loss": 0.5001, "lr": 9.999928410603897e-06, "epoch": 2.03125, "percentage": 10.16, "elapsed_time": "0:06:24", "remaining_time": "0:56:37", "throughput": 5860.37, "total_tokens": 2250544} {"current_steps": 3450, "total_steps": 33920, "loss": 0.5998, "lr": 9.999913981569502e-06, "epoch": 2.0341981132075473, "percentage": 10.17, "elapsed_time": "0:06:24", "remaining_time": "0:56:36", "throughput": 5860.52, "total_tokens": 2253552} {"current_steps": 3455, "total_steps": 33920, "loss": 0.5376, "lr": 9.999898228786332e-06, "epoch": 2.037146226415094, "percentage": 10.19, "elapsed_time": "0:06:25", "remaining_time": "0:56:35", "throughput": 5859.5, "total_tokens": 2256208} {"current_steps": 3460, "total_steps": 33920, "loss": 0.5176, "lr": 9.999881152258557e-06, "epoch": 2.0400943396226414, "percentage": 10.2, "elapsed_time": "0:06:25", "remaining_time": "0:56:34", "throughput": 5859.9, "total_tokens": 2259536} {"current_steps": 3465, "total_steps": 33920, "loss": 0.497, "lr": 9.999862751990697e-06, "epoch": 2.0430424528301887, "percentage": 10.22, "elapsed_time": "0:06:26", "remaining_time": "0:56:33", "throughput": 5860.18, "total_tokens": 2262448} {"current_steps": 3470, "total_steps": 33920, "loss": 0.455, "lr": 9.999843027987628e-06, "epoch": 2.045990566037736, "percentage": 10.23, "elapsed_time": "0:06:26", "remaining_time": "0:56:32", "throughput": 5861.28, "total_tokens": 2266160} {"current_steps": 3475, "total_steps": 33920, "loss": 0.5841, "lr": 9.999821980254567e-06, "epoch": 2.048938679245283, "percentage": 10.24, "elapsed_time": "0:06:27", "remaining_time": "0:56:31", "throughput": 5861.3, "total_tokens": 2269232} {"current_steps": 3480, "total_steps": 33920, "loss": 0.4524, "lr": 9.99979960879709e-06, "epoch": 2.05188679245283, "percentage": 10.26, "elapsed_time": "0:06:27", "remaining_time": "0:56:31", "throughput": 5861.73, "total_tokens": 2272720} {"current_steps": 3485, "total_steps": 33920, "loss": 0.4712, "lr": 9.99977591362112e-06, "epoch": 2.0548349056603774, "percentage": 10.27, "elapsed_time": "0:06:28", "remaining_time": "0:56:30", "throughput": 5861.96, "total_tokens": 2275632} {"current_steps": 3490, "total_steps": 33920, "loss": 0.3858, "lr": 9.999750894732927e-06, "epoch": 2.0577830188679247, "percentage": 10.29, "elapsed_time": "0:06:28", "remaining_time": "0:56:28", "throughput": 5860.71, "total_tokens": 2277936} {"current_steps": 3495, "total_steps": 33920, "loss": 0.6106, "lr": 9.999724552139136e-06, "epoch": 2.0607311320754715, "percentage": 10.3, "elapsed_time": "0:06:29", "remaining_time": "0:56:27", "throughput": 5860.5, "total_tokens": 2280624} {"current_steps": 3500, "total_steps": 33920, "loss": 0.5104, "lr": 9.999696885846724e-06, "epoch": 2.063679245283019, "percentage": 10.32, "elapsed_time": "0:06:30", "remaining_time": "0:56:31", "throughput": 5861.44, "total_tokens": 2287312} {"current_steps": 3505, "total_steps": 33920, "loss": 0.4961, "lr": 9.999667895863012e-06, "epoch": 2.066627358490566, "percentage": 10.33, "elapsed_time": "0:06:30", "remaining_time": "0:56:30", "throughput": 5860.95, "total_tokens": 2289904} {"current_steps": 3510, "total_steps": 33920, "loss": 0.4808, "lr": 9.99963758219568e-06, "epoch": 2.0695754716981134, "percentage": 10.35, "elapsed_time": "0:06:31", "remaining_time": "0:56:29", "throughput": 5861.8, "total_tokens": 2293264} {"current_steps": 3515, "total_steps": 33920, "loss": 0.454, "lr": 9.999605944852749e-06, "epoch": 2.0725235849056602, "percentage": 10.36, "elapsed_time": "0:06:31", "remaining_time": "0:56:28", "throughput": 5861.63, "total_tokens": 2296048} {"current_steps": 3520, "total_steps": 33920, "loss": 0.4187, "lr": 9.999572983842599e-06, "epoch": 2.0754716981132075, "percentage": 10.38, "elapsed_time": "0:06:32", "remaining_time": "0:56:27", "throughput": 5862.24, "total_tokens": 2299280} {"current_steps": 3525, "total_steps": 33920, "loss": 0.4511, "lr": 9.999538699173951e-06, "epoch": 2.078419811320755, "percentage": 10.39, "elapsed_time": "0:06:32", "remaining_time": "0:56:26", "throughput": 5861.83, "total_tokens": 2302128} {"current_steps": 3530, "total_steps": 33920, "loss": 0.4407, "lr": 9.99950309085589e-06, "epoch": 2.081367924528302, "percentage": 10.41, "elapsed_time": "0:06:33", "remaining_time": "0:56:27", "throughput": 5862.35, "total_tokens": 2306896} {"current_steps": 3535, "total_steps": 33920, "loss": 0.4563, "lr": 9.999466158897835e-06, "epoch": 2.084316037735849, "percentage": 10.42, "elapsed_time": "0:06:34", "remaining_time": "0:56:26", "throughput": 5862.31, "total_tokens": 2309808} {"current_steps": 3540, "total_steps": 33920, "loss": 0.566, "lr": 9.999427903309569e-06, "epoch": 2.0872641509433962, "percentage": 10.44, "elapsed_time": "0:06:34", "remaining_time": "0:56:25", "throughput": 5862.89, "total_tokens": 2313104} {"current_steps": 3545, "total_steps": 33920, "loss": 0.5894, "lr": 9.99938832410122e-06, "epoch": 2.0902122641509435, "percentage": 10.45, "elapsed_time": "0:06:35", "remaining_time": "0:56:24", "throughput": 5863.62, "total_tokens": 2316368} {"current_steps": 3550, "total_steps": 33920, "loss": 0.459, "lr": 9.999347421283267e-06, "epoch": 2.0931603773584904, "percentage": 10.47, "elapsed_time": "0:06:35", "remaining_time": "0:56:23", "throughput": 5863.15, "total_tokens": 2319184} {"current_steps": 3555, "total_steps": 33920, "loss": 0.6886, "lr": 9.999305194866538e-06, "epoch": 2.0961084905660377, "percentage": 10.48, "elapsed_time": "0:06:36", "remaining_time": "0:56:23", "throughput": 5863.7, "total_tokens": 2322896} {"current_steps": 3560, "total_steps": 33920, "loss": 0.4123, "lr": 9.99926164486221e-06, "epoch": 2.099056603773585, "percentage": 10.5, "elapsed_time": "0:06:36", "remaining_time": "0:56:22", "throughput": 5864.23, "total_tokens": 2326224} {"current_steps": 3565, "total_steps": 33920, "loss": 0.5663, "lr": 9.99921677128182e-06, "epoch": 2.1020047169811322, "percentage": 10.51, "elapsed_time": "0:06:37", "remaining_time": "0:56:21", "throughput": 5865.09, "total_tokens": 2329552} {"current_steps": 3570, "total_steps": 33920, "loss": 0.6796, "lr": 9.99917057413724e-06, "epoch": 2.104952830188679, "percentage": 10.52, "elapsed_time": "0:06:37", "remaining_time": "0:56:22", "throughput": 5867.04, "total_tokens": 2334288} {"current_steps": 3575, "total_steps": 33920, "loss": 0.5253, "lr": 9.99912305344071e-06, "epoch": 2.1079009433962264, "percentage": 10.54, "elapsed_time": "0:06:38", "remaining_time": "0:56:22", "throughput": 5866.39, "total_tokens": 2337968} {"current_steps": 3580, "total_steps": 33920, "loss": 0.4651, "lr": 9.999074209204803e-06, "epoch": 2.1108490566037736, "percentage": 10.55, "elapsed_time": "0:06:39", "remaining_time": "0:56:23", "throughput": 5867.34, "total_tokens": 2342160} {"current_steps": 3585, "total_steps": 33920, "loss": 0.4624, "lr": 9.999024041442455e-06, "epoch": 2.113797169811321, "percentage": 10.57, "elapsed_time": "0:06:39", "remaining_time": "0:56:22", "throughput": 5867.97, "total_tokens": 2346000} {"current_steps": 3590, "total_steps": 33920, "loss": 0.4804, "lr": 9.998972550166948e-06, "epoch": 2.1167452830188678, "percentage": 10.58, "elapsed_time": "0:06:40", "remaining_time": "0:56:21", "throughput": 5867.59, "total_tokens": 2348656} {"current_steps": 3595, "total_steps": 33920, "loss": 0.427, "lr": 9.998919735391915e-06, "epoch": 2.119693396226415, "percentage": 10.6, "elapsed_time": "0:06:40", "remaining_time": "0:56:20", "throughput": 5867.42, "total_tokens": 2351344} {"current_steps": 3600, "total_steps": 33920, "loss": 0.5055, "lr": 9.998865597131336e-06, "epoch": 2.1226415094339623, "percentage": 10.61, "elapsed_time": "0:06:41", "remaining_time": "0:56:19", "throughput": 5867.25, "total_tokens": 2354160} {"current_steps": 3605, "total_steps": 33920, "loss": 0.4365, "lr": 9.998810135399545e-06, "epoch": 2.1255896226415096, "percentage": 10.63, "elapsed_time": "0:06:41", "remaining_time": "0:56:18", "throughput": 5867.77, "total_tokens": 2357744} {"current_steps": 3610, "total_steps": 33920, "loss": 0.4861, "lr": 9.99875335021123e-06, "epoch": 2.1285377358490565, "percentage": 10.64, "elapsed_time": "0:06:42", "remaining_time": "0:56:18", "throughput": 5868.36, "total_tokens": 2361264} {"current_steps": 3615, "total_steps": 33920, "loss": 0.394, "lr": 9.998695241581423e-06, "epoch": 2.1314858490566038, "percentage": 10.66, "elapsed_time": "0:06:42", "remaining_time": "0:56:18", "throughput": 5869.16, "total_tokens": 2365072} {"current_steps": 3620, "total_steps": 33920, "loss": 0.5237, "lr": 9.998635809525504e-06, "epoch": 2.134433962264151, "percentage": 10.67, "elapsed_time": "0:06:43", "remaining_time": "0:56:17", "throughput": 5868.55, "total_tokens": 2367856} {"current_steps": 3625, "total_steps": 33920, "loss": 0.4819, "lr": 9.998575054059212e-06, "epoch": 2.137382075471698, "percentage": 10.69, "elapsed_time": "0:06:43", "remaining_time": "0:56:15", "throughput": 5868.47, "total_tokens": 2370576} {"current_steps": 3630, "total_steps": 33920, "loss": 0.4702, "lr": 9.998512975198633e-06, "epoch": 2.140330188679245, "percentage": 10.7, "elapsed_time": "0:06:44", "remaining_time": "0:56:14", "throughput": 5867.35, "total_tokens": 2372912} {"current_steps": 3635, "total_steps": 33920, "loss": 0.4821, "lr": 9.998449572960202e-06, "epoch": 2.1432783018867925, "percentage": 10.72, "elapsed_time": "0:06:44", "remaining_time": "0:56:14", "throughput": 5868.54, "total_tokens": 2376688} {"current_steps": 3640, "total_steps": 33920, "loss": 0.8291, "lr": 9.998384847360705e-06, "epoch": 2.1462264150943398, "percentage": 10.73, "elapsed_time": "0:06:45", "remaining_time": "0:56:13", "throughput": 5868.47, "total_tokens": 2379568} {"current_steps": 3645, "total_steps": 33920, "loss": 0.5631, "lr": 9.998318798417276e-06, "epoch": 2.1491745283018866, "percentage": 10.75, "elapsed_time": "0:06:46", "remaining_time": "0:56:12", "throughput": 5868.89, "total_tokens": 2383056} {"current_steps": 3650, "total_steps": 33920, "loss": 0.4873, "lr": 9.998251426147403e-06, "epoch": 2.152122641509434, "percentage": 10.76, "elapsed_time": "0:06:46", "remaining_time": "0:56:11", "throughput": 5868.67, "total_tokens": 2385872} {"current_steps": 3655, "total_steps": 33920, "loss": 0.5898, "lr": 9.998182730568927e-06, "epoch": 2.155070754716981, "percentage": 10.78, "elapsed_time": "0:06:47", "remaining_time": "0:56:10", "throughput": 5867.86, "total_tokens": 2388560} {"current_steps": 3660, "total_steps": 33920, "loss": 0.5721, "lr": 9.998112711700028e-06, "epoch": 2.1580188679245285, "percentage": 10.79, "elapsed_time": "0:06:47", "remaining_time": "0:56:09", "throughput": 5868.48, "total_tokens": 2392016} {"current_steps": 3665, "total_steps": 33920, "loss": 0.6504, "lr": 9.99804136955925e-06, "epoch": 2.1609669811320753, "percentage": 10.8, "elapsed_time": "0:06:48", "remaining_time": "0:56:08", "throughput": 5867.91, "total_tokens": 2394576} {"current_steps": 3670, "total_steps": 33920, "loss": 0.5721, "lr": 9.99796870416548e-06, "epoch": 2.1639150943396226, "percentage": 10.82, "elapsed_time": "0:06:48", "remaining_time": "0:56:07", "throughput": 5867.68, "total_tokens": 2397424} {"current_steps": 3675, "total_steps": 33920, "loss": 0.4476, "lr": 9.997894715537953e-06, "epoch": 2.16686320754717, "percentage": 10.83, "elapsed_time": "0:06:49", "remaining_time": "0:56:07", "throughput": 5868.35, "total_tokens": 2400848} {"current_steps": 3680, "total_steps": 33920, "loss": 0.4068, "lr": 9.997819403696263e-06, "epoch": 2.169811320754717, "percentage": 10.85, "elapsed_time": "0:06:49", "remaining_time": "0:56:06", "throughput": 5869.41, "total_tokens": 2404688} {"current_steps": 3685, "total_steps": 33920, "loss": 0.6369, "lr": 9.997742768660345e-06, "epoch": 2.172759433962264, "percentage": 10.86, "elapsed_time": "0:06:50", "remaining_time": "0:56:05", "throughput": 5869.61, "total_tokens": 2407632} {"current_steps": 3690, "total_steps": 33920, "loss": 0.456, "lr": 9.99766481045049e-06, "epoch": 2.1757075471698113, "percentage": 10.88, "elapsed_time": "0:06:50", "remaining_time": "0:56:06", "throughput": 5871.25, "total_tokens": 2412464} {"current_steps": 3695, "total_steps": 33920, "loss": 0.3509, "lr": 9.997585529087338e-06, "epoch": 2.1786556603773586, "percentage": 10.89, "elapsed_time": "0:06:51", "remaining_time": "0:56:05", "throughput": 5871.15, "total_tokens": 2415440} {"current_steps": 3700, "total_steps": 33920, "loss": 0.6574, "lr": 9.997504924591878e-06, "epoch": 2.1816037735849054, "percentage": 10.91, "elapsed_time": "0:06:51", "remaining_time": "0:56:04", "throughput": 5871.96, "total_tokens": 2418928} {"current_steps": 3705, "total_steps": 33920, "loss": 0.4771, "lr": 9.99742299698545e-06, "epoch": 2.1845518867924527, "percentage": 10.92, "elapsed_time": "0:06:52", "remaining_time": "0:56:03", "throughput": 5872.48, "total_tokens": 2422160} {"current_steps": 3710, "total_steps": 33920, "loss": 0.4365, "lr": 9.997339746289749e-06, "epoch": 2.1875, "percentage": 10.94, "elapsed_time": "0:06:53", "remaining_time": "0:56:03", "throughput": 5873.35, "total_tokens": 2426352} {"current_steps": 3715, "total_steps": 33920, "loss": 0.4523, "lr": 9.997255172526812e-06, "epoch": 2.1904481132075473, "percentage": 10.95, "elapsed_time": "0:06:53", "remaining_time": "0:56:03", "throughput": 5874.62, "total_tokens": 2430544} {"current_steps": 3720, "total_steps": 33920, "loss": 0.5889, "lr": 9.99716927571903e-06, "epoch": 2.1933962264150946, "percentage": 10.97, "elapsed_time": "0:06:54", "remaining_time": "0:56:03", "throughput": 5874.87, "total_tokens": 2433744} {"current_steps": 3725, "total_steps": 33920, "loss": 0.5652, "lr": 9.997082055889147e-06, "epoch": 2.1963443396226414, "percentage": 10.98, "elapsed_time": "0:06:54", "remaining_time": "0:56:02", "throughput": 5874.23, "total_tokens": 2436624} {"current_steps": 3730, "total_steps": 33920, "loss": 0.4681, "lr": 9.996993513060252e-06, "epoch": 2.1992924528301887, "percentage": 11.0, "elapsed_time": "0:06:55", "remaining_time": "0:56:01", "throughput": 5872.3, "total_tokens": 2438672} {"current_steps": 3735, "total_steps": 33920, "loss": 0.3877, "lr": 9.996903647255789e-06, "epoch": 2.202240566037736, "percentage": 11.01, "elapsed_time": "0:06:55", "remaining_time": "0:56:00", "throughput": 5872.82, "total_tokens": 2442256} {"current_steps": 3740, "total_steps": 33920, "loss": 0.5571, "lr": 9.99681245849955e-06, "epoch": 2.205188679245283, "percentage": 11.03, "elapsed_time": "0:06:56", "remaining_time": "0:55:59", "throughput": 5872.79, "total_tokens": 2445264} {"current_steps": 3745, "total_steps": 33920, "loss": 0.5638, "lr": 9.996719946815679e-06, "epoch": 2.20813679245283, "percentage": 11.04, "elapsed_time": "0:06:56", "remaining_time": "0:55:59", "throughput": 5873.45, "total_tokens": 2448816} {"current_steps": 3750, "total_steps": 33920, "loss": 0.5967, "lr": 9.996626112228665e-06, "epoch": 2.2110849056603774, "percentage": 11.06, "elapsed_time": "0:06:57", "remaining_time": "0:55:58", "throughput": 5872.61, "total_tokens": 2451344} {"current_steps": 3755, "total_steps": 33920, "loss": 0.3934, "lr": 9.996530954763355e-06, "epoch": 2.2140330188679247, "percentage": 11.07, "elapsed_time": "0:06:57", "remaining_time": "0:55:56", "throughput": 5872.03, "total_tokens": 2453808} {"current_steps": 3760, "total_steps": 33920, "loss": 0.3961, "lr": 9.99643447444494e-06, "epoch": 2.2169811320754715, "percentage": 11.08, "elapsed_time": "0:06:58", "remaining_time": "0:55:55", "throughput": 5872.47, "total_tokens": 2456816} {"current_steps": 3765, "total_steps": 33920, "loss": 0.5955, "lr": 9.996336671298965e-06, "epoch": 2.219929245283019, "percentage": 11.1, "elapsed_time": "0:06:58", "remaining_time": "0:55:55", "throughput": 5873.66, "total_tokens": 2460816} {"current_steps": 3770, "total_steps": 33920, "loss": 0.6665, "lr": 9.996237545351323e-06, "epoch": 2.222877358490566, "percentage": 11.11, "elapsed_time": "0:06:59", "remaining_time": "0:55:54", "throughput": 5874.02, "total_tokens": 2464016} {"current_steps": 3775, "total_steps": 33920, "loss": 0.4216, "lr": 9.996137096628259e-06, "epoch": 2.2258254716981134, "percentage": 11.13, "elapsed_time": "0:07:00", "remaining_time": "0:55:54", "throughput": 5874.62, "total_tokens": 2467536} {"current_steps": 3780, "total_steps": 33920, "loss": 0.4539, "lr": 9.996035325156366e-06, "epoch": 2.2287735849056602, "percentage": 11.14, "elapsed_time": "0:07:00", "remaining_time": "0:55:53", "throughput": 5875.15, "total_tokens": 2470928} {"current_steps": 3785, "total_steps": 33920, "loss": 0.3544, "lr": 9.995932230962589e-06, "epoch": 2.2317216981132075, "percentage": 11.16, "elapsed_time": "0:07:01", "remaining_time": "0:55:53", "throughput": 5876.19, "total_tokens": 2474928} {"current_steps": 3790, "total_steps": 33920, "loss": 0.7117, "lr": 9.995827814074223e-06, "epoch": 2.234669811320755, "percentage": 11.17, "elapsed_time": "0:07:01", "remaining_time": "0:55:52", "throughput": 5875.29, "total_tokens": 2477456} {"current_steps": 3795, "total_steps": 33920, "loss": 0.6492, "lr": 9.995722074518913e-06, "epoch": 2.237617924528302, "percentage": 11.19, "elapsed_time": "0:07:02", "remaining_time": "0:55:50", "throughput": 5874.73, "total_tokens": 2479888} {"current_steps": 3800, "total_steps": 33920, "loss": 0.2765, "lr": 9.99561501232465e-06, "epoch": 2.240566037735849, "percentage": 11.2, "elapsed_time": "0:07:02", "remaining_time": "0:55:50", "throughput": 5875.21, "total_tokens": 2483344} {"current_steps": 3805, "total_steps": 33920, "loss": 0.4672, "lr": 9.995506627519786e-06, "epoch": 2.2435141509433962, "percentage": 11.22, "elapsed_time": "0:07:03", "remaining_time": "0:55:49", "throughput": 5875.0, "total_tokens": 2486448} {"current_steps": 3810, "total_steps": 33920, "loss": 0.7162, "lr": 9.995396920133012e-06, "epoch": 2.2464622641509435, "percentage": 11.23, "elapsed_time": "0:07:03", "remaining_time": "0:55:48", "throughput": 5875.06, "total_tokens": 2489392} {"current_steps": 3815, "total_steps": 33920, "loss": 0.4994, "lr": 9.995285890193373e-06, "epoch": 2.2494103773584904, "percentage": 11.25, "elapsed_time": "0:07:04", "remaining_time": "0:55:47", "throughput": 5875.19, "total_tokens": 2492400} {"current_steps": 3820, "total_steps": 33920, "loss": 0.4635, "lr": 9.995173537730267e-06, "epoch": 2.2523584905660377, "percentage": 11.26, "elapsed_time": "0:07:04", "remaining_time": "0:55:46", "throughput": 5874.38, "total_tokens": 2495088} {"current_steps": 3825, "total_steps": 33920, "loss": 0.4547, "lr": 9.99505986277344e-06, "epoch": 2.255306603773585, "percentage": 11.28, "elapsed_time": "0:07:05", "remaining_time": "0:55:46", "throughput": 5874.89, "total_tokens": 2498640} {"current_steps": 3830, "total_steps": 33920, "loss": 0.5333, "lr": 9.994944865352986e-06, "epoch": 2.2582547169811322, "percentage": 11.29, "elapsed_time": "0:07:05", "remaining_time": "0:55:45", "throughput": 5874.26, "total_tokens": 2501424} {"current_steps": 3835, "total_steps": 33920, "loss": 0.461, "lr": 9.994828545499351e-06, "epoch": 2.261202830188679, "percentage": 11.31, "elapsed_time": "0:07:06", "remaining_time": "0:55:44", "throughput": 5874.84, "total_tokens": 2504816} {"current_steps": 3840, "total_steps": 33920, "loss": 0.6171, "lr": 9.994710903243334e-06, "epoch": 2.2641509433962264, "percentage": 11.32, "elapsed_time": "0:07:06", "remaining_time": "0:55:44", "throughput": 5875.18, "total_tokens": 2508272} {"current_steps": 3845, "total_steps": 33920, "loss": 0.5321, "lr": 9.994591938616079e-06, "epoch": 2.2670990566037736, "percentage": 11.34, "elapsed_time": "0:07:07", "remaining_time": "0:55:43", "throughput": 5875.74, "total_tokens": 2511664} {"current_steps": 3850, "total_steps": 33920, "loss": 0.646, "lr": 9.994471651649082e-06, "epoch": 2.270047169811321, "percentage": 11.35, "elapsed_time": "0:07:07", "remaining_time": "0:55:42", "throughput": 5875.69, "total_tokens": 2514384} {"current_steps": 3855, "total_steps": 33920, "loss": 0.4872, "lr": 9.99435004237419e-06, "epoch": 2.2729952830188678, "percentage": 11.36, "elapsed_time": "0:07:08", "remaining_time": "0:55:41", "throughput": 5874.94, "total_tokens": 2517136} {"current_steps": 3860, "total_steps": 33920, "loss": 0.3894, "lr": 9.9942271108236e-06, "epoch": 2.275943396226415, "percentage": 11.38, "elapsed_time": "0:07:08", "remaining_time": "0:55:40", "throughput": 5875.26, "total_tokens": 2520464} {"current_steps": 3865, "total_steps": 33920, "loss": 0.5706, "lr": 9.994102857029859e-06, "epoch": 2.2788915094339623, "percentage": 11.39, "elapsed_time": "0:07:09", "remaining_time": "0:55:39", "throughput": 5875.62, "total_tokens": 2523568} {"current_steps": 3870, "total_steps": 33920, "loss": 0.55, "lr": 9.993977281025862e-06, "epoch": 2.2818396226415096, "percentage": 11.41, "elapsed_time": "0:07:10", "remaining_time": "0:55:39", "throughput": 5876.05, "total_tokens": 2526928} {"current_steps": 3875, "total_steps": 33920, "loss": 0.53, "lr": 9.993850382844858e-06, "epoch": 2.2847877358490565, "percentage": 11.42, "elapsed_time": "0:07:10", "remaining_time": "0:55:38", "throughput": 5877.16, "total_tokens": 2530864} {"current_steps": 3880, "total_steps": 33920, "loss": 0.504, "lr": 9.993722162520443e-06, "epoch": 2.2877358490566038, "percentage": 11.44, "elapsed_time": "0:07:11", "remaining_time": "0:55:38", "throughput": 5878.02, "total_tokens": 2534992} {"current_steps": 3885, "total_steps": 33920, "loss": 0.6044, "lr": 9.993592620086564e-06, "epoch": 2.290683962264151, "percentage": 11.45, "elapsed_time": "0:07:11", "remaining_time": "0:55:38", "throughput": 5878.21, "total_tokens": 2538032} {"current_steps": 3890, "total_steps": 33920, "loss": 0.5696, "lr": 9.993461755577518e-06, "epoch": 2.293632075471698, "percentage": 11.47, "elapsed_time": "0:07:12", "remaining_time": "0:55:37", "throughput": 5877.84, "total_tokens": 2540912} {"current_steps": 3895, "total_steps": 33920, "loss": 0.3586, "lr": 9.99332956902795e-06, "epoch": 2.296580188679245, "percentage": 11.48, "elapsed_time": "0:07:12", "remaining_time": "0:55:35", "throughput": 5877.66, "total_tokens": 2543600} {"current_steps": 3900, "total_steps": 33920, "loss": 0.5448, "lr": 9.993196060472859e-06, "epoch": 2.2995283018867925, "percentage": 11.5, "elapsed_time": "0:07:13", "remaining_time": "0:55:36", "throughput": 5877.45, "total_tokens": 2547408} {"current_steps": 3905, "total_steps": 33920, "loss": 0.4536, "lr": 9.993061229947591e-06, "epoch": 2.3024764150943398, "percentage": 11.51, "elapsed_time": "0:07:13", "remaining_time": "0:55:35", "throughput": 5877.64, "total_tokens": 2550352} {"current_steps": 3910, "total_steps": 33920, "loss": 0.571, "lr": 9.992925077487845e-06, "epoch": 2.3054245283018866, "percentage": 11.53, "elapsed_time": "0:07:14", "remaining_time": "0:55:34", "throughput": 5877.72, "total_tokens": 2553456} {"current_steps": 3915, "total_steps": 33920, "loss": 0.5683, "lr": 9.992787603129666e-06, "epoch": 2.308372641509434, "percentage": 11.54, "elapsed_time": "0:07:14", "remaining_time": "0:55:33", "throughput": 5877.74, "total_tokens": 2556560} {"current_steps": 3920, "total_steps": 33920, "loss": 0.5614, "lr": 9.99264880690945e-06, "epoch": 2.311320754716981, "percentage": 11.56, "elapsed_time": "0:07:15", "remaining_time": "0:55:33", "throughput": 5878.39, "total_tokens": 2560208} {"current_steps": 3925, "total_steps": 33920, "loss": 0.5344, "lr": 9.992508688863947e-06, "epoch": 2.3142688679245285, "percentage": 11.57, "elapsed_time": "0:07:16", "remaining_time": "0:55:32", "throughput": 5877.71, "total_tokens": 2562768} {"current_steps": 3930, "total_steps": 33920, "loss": 0.4333, "lr": 9.99236724903025e-06, "epoch": 2.3172169811320753, "percentage": 11.59, "elapsed_time": "0:07:16", "remaining_time": "0:55:31", "throughput": 5878.34, "total_tokens": 2566416} {"current_steps": 3935, "total_steps": 33920, "loss": 0.5047, "lr": 9.992224487445809e-06, "epoch": 2.3201650943396226, "percentage": 11.6, "elapsed_time": "0:07:17", "remaining_time": "0:55:30", "throughput": 5878.56, "total_tokens": 2569616} {"current_steps": 3940, "total_steps": 33920, "loss": 0.4573, "lr": 9.99208040414842e-06, "epoch": 2.32311320754717, "percentage": 11.62, "elapsed_time": "0:07:17", "remaining_time": "0:55:29", "throughput": 5878.39, "total_tokens": 2572560} {"current_steps": 3945, "total_steps": 33920, "loss": 0.4473, "lr": 9.99193499917623e-06, "epoch": 2.326061320754717, "percentage": 11.63, "elapsed_time": "0:07:18", "remaining_time": "0:55:28", "throughput": 5878.54, "total_tokens": 2575312} {"current_steps": 3950, "total_steps": 33920, "loss": 0.4401, "lr": 9.991788272567735e-06, "epoch": 2.329009433962264, "percentage": 11.65, "elapsed_time": "0:07:18", "remaining_time": "0:55:27", "throughput": 5878.76, "total_tokens": 2578448} {"current_steps": 3955, "total_steps": 33920, "loss": 0.4222, "lr": 9.991640224361781e-06, "epoch": 2.3319575471698113, "percentage": 11.66, "elapsed_time": "0:07:19", "remaining_time": "0:55:27", "throughput": 5879.97, "total_tokens": 2582384} {"current_steps": 3960, "total_steps": 33920, "loss": 0.3575, "lr": 9.991490854597563e-06, "epoch": 2.3349056603773586, "percentage": 11.67, "elapsed_time": "0:07:19", "remaining_time": "0:55:26", "throughput": 5880.34, "total_tokens": 2585456} {"current_steps": 3965, "total_steps": 33920, "loss": 0.4573, "lr": 9.991340163314632e-06, "epoch": 2.3378537735849054, "percentage": 11.69, "elapsed_time": "0:07:20", "remaining_time": "0:55:27", "throughput": 5882.15, "total_tokens": 2590448} {"current_steps": 3970, "total_steps": 33920, "loss": 0.5791, "lr": 9.991188150552878e-06, "epoch": 2.3408018867924527, "percentage": 11.7, "elapsed_time": "0:07:20", "remaining_time": "0:55:26", "throughput": 5882.55, "total_tokens": 2593872} {"current_steps": 3975, "total_steps": 33920, "loss": 0.5234, "lr": 9.991034816352553e-06, "epoch": 2.34375, "percentage": 11.72, "elapsed_time": "0:07:21", "remaining_time": "0:55:25", "throughput": 5883.63, "total_tokens": 2597648} {"current_steps": 3980, "total_steps": 33920, "loss": 0.4496, "lr": 9.990880160754248e-06, "epoch": 2.3466981132075473, "percentage": 11.73, "elapsed_time": "0:07:21", "remaining_time": "0:55:24", "throughput": 5883.0, "total_tokens": 2600048} {"current_steps": 3985, "total_steps": 33920, "loss": 0.4534, "lr": 9.990724183798914e-06, "epoch": 2.3496462264150946, "percentage": 11.75, "elapsed_time": "0:07:22", "remaining_time": "0:55:24", "throughput": 5883.22, "total_tokens": 2603632} {"current_steps": 3990, "total_steps": 33920, "loss": 0.4845, "lr": 9.990566885527841e-06, "epoch": 2.3525943396226414, "percentage": 11.76, "elapsed_time": "0:07:23", "remaining_time": "0:55:23", "throughput": 5884.19, "total_tokens": 2607216} {"current_steps": 3995, "total_steps": 33920, "loss": 0.5368, "lr": 9.99040826598268e-06, "epoch": 2.3555424528301887, "percentage": 11.78, "elapsed_time": "0:07:23", "remaining_time": "0:55:22", "throughput": 5884.47, "total_tokens": 2610256} {"current_steps": 4000, "total_steps": 33920, "loss": 0.4007, "lr": 9.990248325205418e-06, "epoch": 2.358490566037736, "percentage": 11.79, "elapsed_time": "0:07:24", "remaining_time": "0:55:22", "throughput": 5884.84, "total_tokens": 2613616} {"current_steps": 4005, "total_steps": 33920, "loss": 0.5299, "lr": 9.990087063238408e-06, "epoch": 2.361438679245283, "percentage": 11.81, "elapsed_time": "0:07:24", "remaining_time": "0:55:21", "throughput": 5885.37, "total_tokens": 2617104} {"current_steps": 4010, "total_steps": 33920, "loss": 0.5633, "lr": 9.989924480124342e-06, "epoch": 2.36438679245283, "percentage": 11.82, "elapsed_time": "0:07:25", "remaining_time": "0:55:20", "throughput": 5884.97, "total_tokens": 2619856} {"current_steps": 4015, "total_steps": 33920, "loss": 0.5369, "lr": 9.989760575906264e-06, "epoch": 2.3673349056603774, "percentage": 11.84, "elapsed_time": "0:07:25", "remaining_time": "0:55:19", "throughput": 5885.55, "total_tokens": 2623344} {"current_steps": 4020, "total_steps": 33920, "loss": 0.5063, "lr": 9.98959535062757e-06, "epoch": 2.3702830188679247, "percentage": 11.85, "elapsed_time": "0:07:26", "remaining_time": "0:55:19", "throughput": 5886.52, "total_tokens": 2627024} {"current_steps": 4025, "total_steps": 33920, "loss": 0.4324, "lr": 9.989428804332002e-06, "epoch": 2.3732311320754715, "percentage": 11.87, "elapsed_time": "0:07:26", "remaining_time": "0:55:18", "throughput": 5886.7, "total_tokens": 2629968} {"current_steps": 4030, "total_steps": 33920, "loss": 0.524, "lr": 9.989260937063656e-06, "epoch": 2.376179245283019, "percentage": 11.88, "elapsed_time": "0:07:27", "remaining_time": "0:55:17", "throughput": 5886.97, "total_tokens": 2633328} {"current_steps": 4035, "total_steps": 33920, "loss": 0.4958, "lr": 9.989091748866973e-06, "epoch": 2.379127358490566, "percentage": 11.9, "elapsed_time": "0:07:27", "remaining_time": "0:55:17", "throughput": 5887.94, "total_tokens": 2637360} {"current_steps": 4040, "total_steps": 33920, "loss": 0.436, "lr": 9.988921239786748e-06, "epoch": 2.3820754716981134, "percentage": 11.91, "elapsed_time": "0:07:28", "remaining_time": "0:55:16", "throughput": 5887.99, "total_tokens": 2640496} {"current_steps": 4045, "total_steps": 33920, "loss": 0.5028, "lr": 9.988749409868124e-06, "epoch": 2.3850235849056602, "percentage": 11.93, "elapsed_time": "0:07:28", "remaining_time": "0:55:15", "throughput": 5887.74, "total_tokens": 2643280} {"current_steps": 4050, "total_steps": 33920, "loss": 0.5083, "lr": 9.988576259156593e-06, "epoch": 2.3879716981132075, "percentage": 11.94, "elapsed_time": "0:07:29", "remaining_time": "0:55:14", "throughput": 5887.41, "total_tokens": 2646000} {"current_steps": 4055, "total_steps": 33920, "loss": 0.4772, "lr": 9.988401787697996e-06, "epoch": 2.390919811320755, "percentage": 11.95, "elapsed_time": "0:07:29", "remaining_time": "0:55:14", "throughput": 5888.11, "total_tokens": 2649520} {"current_steps": 4060, "total_steps": 33920, "loss": 0.5954, "lr": 9.98822599553853e-06, "epoch": 2.393867924528302, "percentage": 11.97, "elapsed_time": "0:07:30", "remaining_time": "0:55:13", "throughput": 5888.24, "total_tokens": 2652528} {"current_steps": 4065, "total_steps": 33920, "loss": 0.519, "lr": 9.988048882724732e-06, "epoch": 2.396816037735849, "percentage": 11.98, "elapsed_time": "0:07:30", "remaining_time": "0:55:12", "throughput": 5887.81, "total_tokens": 2655184} {"current_steps": 4070, "total_steps": 33920, "loss": 0.4735, "lr": 9.987870449303497e-06, "epoch": 2.3997641509433962, "percentage": 12.0, "elapsed_time": "0:07:31", "remaining_time": "0:55:11", "throughput": 5887.34, "total_tokens": 2658192} {"current_steps": 4075, "total_steps": 33920, "loss": 0.4967, "lr": 9.98769069532206e-06, "epoch": 2.4027122641509435, "percentage": 12.01, "elapsed_time": "0:07:32", "remaining_time": "0:55:10", "throughput": 5886.78, "total_tokens": 2660944} {"current_steps": 4080, "total_steps": 33920, "loss": 0.5323, "lr": 9.98750962082802e-06, "epoch": 2.4056603773584904, "percentage": 12.03, "elapsed_time": "0:07:32", "remaining_time": "0:55:09", "throughput": 5886.01, "total_tokens": 2663280} {"current_steps": 4085, "total_steps": 33920, "loss": 0.6117, "lr": 9.987327225869312e-06, "epoch": 2.4086084905660377, "percentage": 12.04, "elapsed_time": "0:07:33", "remaining_time": "0:55:08", "throughput": 5886.48, "total_tokens": 2666576} {"current_steps": 4090, "total_steps": 33920, "loss": 0.5078, "lr": 9.987143510494225e-06, "epoch": 2.411556603773585, "percentage": 12.06, "elapsed_time": "0:07:33", "remaining_time": "0:55:07", "throughput": 5887.26, "total_tokens": 2670064} {"current_steps": 4095, "total_steps": 33920, "loss": 0.4714, "lr": 9.9869584747514e-06, "epoch": 2.4145047169811322, "percentage": 12.07, "elapsed_time": "0:07:34", "remaining_time": "0:55:07", "throughput": 5887.67, "total_tokens": 2673680} {"current_steps": 4100, "total_steps": 33920, "loss": 0.535, "lr": 9.986772118689828e-06, "epoch": 2.417452830188679, "percentage": 12.09, "elapsed_time": "0:07:34", "remaining_time": "0:55:06", "throughput": 5887.82, "total_tokens": 2676688} {"current_steps": 4105, "total_steps": 33920, "loss": 0.6292, "lr": 9.986584442358845e-06, "epoch": 2.4204009433962264, "percentage": 12.1, "elapsed_time": "0:07:35", "remaining_time": "0:55:06", "throughput": 5889.31, "total_tokens": 2681200} {"current_steps": 4110, "total_steps": 33920, "loss": 0.4655, "lr": 9.98639544580814e-06, "epoch": 2.4233490566037736, "percentage": 12.12, "elapsed_time": "0:07:35", "remaining_time": "0:55:05", "throughput": 5889.29, "total_tokens": 2684336} {"current_steps": 4115, "total_steps": 33920, "loss": 0.4135, "lr": 9.98620512908775e-06, "epoch": 2.426297169811321, "percentage": 12.13, "elapsed_time": "0:07:36", "remaining_time": "0:55:05", "throughput": 5889.26, "total_tokens": 2687344} {"current_steps": 4120, "total_steps": 33920, "loss": 0.3735, "lr": 9.986013492248064e-06, "epoch": 2.4292452830188678, "percentage": 12.15, "elapsed_time": "0:07:36", "remaining_time": "0:55:04", "throughput": 5889.22, "total_tokens": 2690224} {"current_steps": 4125, "total_steps": 33920, "loss": 0.4501, "lr": 9.985820535339817e-06, "epoch": 2.432193396226415, "percentage": 12.16, "elapsed_time": "0:07:37", "remaining_time": "0:55:03", "throughput": 5889.26, "total_tokens": 2693104} {"current_steps": 4130, "total_steps": 33920, "loss": 0.4762, "lr": 9.985626258414093e-06, "epoch": 2.4351415094339623, "percentage": 12.18, "elapsed_time": "0:07:37", "remaining_time": "0:55:01", "throughput": 5888.12, "total_tokens": 2695248} {"current_steps": 4135, "total_steps": 33920, "loss": 0.3703, "lr": 9.985430661522333e-06, "epoch": 2.4380896226415096, "percentage": 12.19, "elapsed_time": "0:07:38", "remaining_time": "0:55:01", "throughput": 5888.64, "total_tokens": 2698672} {"current_steps": 4140, "total_steps": 33920, "loss": 0.5363, "lr": 9.98523374471632e-06, "epoch": 2.4410377358490565, "percentage": 12.21, "elapsed_time": "0:07:38", "remaining_time": "0:55:00", "throughput": 5888.13, "total_tokens": 2701264} {"current_steps": 4145, "total_steps": 33920, "loss": 0.5639, "lr": 9.985035508048186e-06, "epoch": 2.4439858490566038, "percentage": 12.22, "elapsed_time": "0:07:39", "remaining_time": "0:54:59", "throughput": 5887.69, "total_tokens": 2704464} {"current_steps": 4150, "total_steps": 33920, "loss": 0.509, "lr": 9.984835951570417e-06, "epoch": 2.446933962264151, "percentage": 12.23, "elapsed_time": "0:07:39", "remaining_time": "0:54:59", "throughput": 5888.3, "total_tokens": 2708080} {"current_steps": 4155, "total_steps": 33920, "loss": 0.5347, "lr": 9.984635075335847e-06, "epoch": 2.449882075471698, "percentage": 12.25, "elapsed_time": "0:07:40", "remaining_time": "0:54:58", "throughput": 5888.1, "total_tokens": 2710832} {"current_steps": 4160, "total_steps": 33920, "loss": 0.5451, "lr": 9.984432879397659e-06, "epoch": 2.452830188679245, "percentage": 12.26, "elapsed_time": "0:07:40", "remaining_time": "0:54:57", "throughput": 5888.03, "total_tokens": 2713712} {"current_steps": 4165, "total_steps": 33920, "loss": 0.4389, "lr": 9.984229363809383e-06, "epoch": 2.4557783018867925, "percentage": 12.28, "elapsed_time": "0:07:41", "remaining_time": "0:54:56", "throughput": 5888.07, "total_tokens": 2716688} {"current_steps": 4170, "total_steps": 33920, "loss": 0.3589, "lr": 9.984024528624904e-06, "epoch": 2.4587264150943398, "percentage": 12.29, "elapsed_time": "0:07:41", "remaining_time": "0:54:55", "throughput": 5886.96, "total_tokens": 2719440} {"current_steps": 4175, "total_steps": 33920, "loss": 0.4865, "lr": 9.98381837389845e-06, "epoch": 2.4616745283018866, "percentage": 12.31, "elapsed_time": "0:07:42", "remaining_time": "0:54:54", "throughput": 5886.26, "total_tokens": 2721840} {"current_steps": 4180, "total_steps": 33920, "loss": 0.5398, "lr": 9.983610899684601e-06, "epoch": 2.464622641509434, "percentage": 12.32, "elapsed_time": "0:07:43", "remaining_time": "0:54:54", "throughput": 5887.46, "total_tokens": 2726192} {"current_steps": 4185, "total_steps": 33920, "loss": 0.5636, "lr": 9.983402106038292e-06, "epoch": 2.467570754716981, "percentage": 12.34, "elapsed_time": "0:07:43", "remaining_time": "0:54:53", "throughput": 5886.85, "total_tokens": 2728816} {"current_steps": 4190, "total_steps": 33920, "loss": 0.5628, "lr": 9.983191993014793e-06, "epoch": 2.4705188679245285, "percentage": 12.35, "elapsed_time": "0:07:44", "remaining_time": "0:54:52", "throughput": 5886.27, "total_tokens": 2731344} {"current_steps": 4195, "total_steps": 33920, "loss": 0.4141, "lr": 9.982980560669742e-06, "epoch": 2.4734669811320753, "percentage": 12.37, "elapsed_time": "0:07:44", "remaining_time": "0:54:51", "throughput": 5886.03, "total_tokens": 2734096} {"current_steps": 4200, "total_steps": 33920, "loss": 0.4932, "lr": 9.98276780905911e-06, "epoch": 2.4764150943396226, "percentage": 12.38, "elapsed_time": "0:07:45", "remaining_time": "0:54:50", "throughput": 5885.85, "total_tokens": 2737040} {"current_steps": 4205, "total_steps": 33920, "loss": 0.4105, "lr": 9.982553738239225e-06, "epoch": 2.47936320754717, "percentage": 12.4, "elapsed_time": "0:07:45", "remaining_time": "0:54:50", "throughput": 5886.04, "total_tokens": 2740528} {"current_steps": 4210, "total_steps": 33920, "loss": 0.4165, "lr": 9.982338348266766e-06, "epoch": 2.482311320754717, "percentage": 12.41, "elapsed_time": "0:07:46", "remaining_time": "0:54:49", "throughput": 5886.27, "total_tokens": 2743728} {"current_steps": 4215, "total_steps": 33920, "loss": 0.5364, "lr": 9.982121639198756e-06, "epoch": 2.485259433962264, "percentage": 12.43, "elapsed_time": "0:07:46", "remaining_time": "0:54:49", "throughput": 5887.56, "total_tokens": 2748464} {"current_steps": 4220, "total_steps": 33920, "loss": 0.5718, "lr": 9.98190361109257e-06, "epoch": 2.4882075471698113, "percentage": 12.44, "elapsed_time": "0:07:47", "remaining_time": "0:54:50", "throughput": 5888.46, "total_tokens": 2752784} {"current_steps": 4225, "total_steps": 33920, "loss": 0.7493, "lr": 9.981684264005934e-06, "epoch": 2.4911556603773586, "percentage": 12.46, "elapsed_time": "0:07:47", "remaining_time": "0:54:49", "throughput": 5888.37, "total_tokens": 2755728} {"current_steps": 4230, "total_steps": 33920, "loss": 0.4883, "lr": 9.981463597996917e-06, "epoch": 2.4941037735849054, "percentage": 12.47, "elapsed_time": "0:07:48", "remaining_time": "0:54:48", "throughput": 5888.81, "total_tokens": 2758960} {"current_steps": 4235, "total_steps": 33920, "loss": 0.532, "lr": 9.981241613123944e-06, "epoch": 2.4970518867924527, "percentage": 12.49, "elapsed_time": "0:07:49", "remaining_time": "0:54:47", "throughput": 5889.52, "total_tokens": 2762480} {"current_steps": 4240, "total_steps": 33920, "loss": 0.406, "lr": 9.981018309445785e-06, "epoch": 2.5, "percentage": 12.5, "elapsed_time": "0:07:49", "remaining_time": "0:54:46", "throughput": 5890.09, "total_tokens": 2765808} {"current_steps": 4245, "total_steps": 33920, "loss": 0.4636, "lr": 9.980793687021564e-06, "epoch": 2.5029481132075473, "percentage": 12.51, "elapsed_time": "0:07:50", "remaining_time": "0:54:46", "throughput": 5890.06, "total_tokens": 2768720} {"current_steps": 4250, "total_steps": 33920, "loss": 0.433, "lr": 9.980567745910746e-06, "epoch": 2.5058962264150946, "percentage": 12.53, "elapsed_time": "0:07:50", "remaining_time": "0:54:45", "throughput": 5890.97, "total_tokens": 2772624} {"current_steps": 4255, "total_steps": 33920, "loss": 0.76, "lr": 9.980340486173155e-06, "epoch": 2.5088443396226414, "percentage": 12.54, "elapsed_time": "0:07:51", "remaining_time": "0:54:45", "throughput": 5891.31, "total_tokens": 2776048} {"current_steps": 4260, "total_steps": 33920, "loss": 0.5102, "lr": 9.980111907868954e-06, "epoch": 2.5117924528301887, "percentage": 12.56, "elapsed_time": "0:07:51", "remaining_time": "0:54:44", "throughput": 5890.56, "total_tokens": 2778576} {"current_steps": 4265, "total_steps": 33920, "loss": 0.4261, "lr": 9.979882011058662e-06, "epoch": 2.514740566037736, "percentage": 12.57, "elapsed_time": "0:07:52", "remaining_time": "0:54:43", "throughput": 5890.32, "total_tokens": 2781328} {"current_steps": 4270, "total_steps": 33920, "loss": 0.5924, "lr": 9.979650795803146e-06, "epoch": 2.517688679245283, "percentage": 12.59, "elapsed_time": "0:07:52", "remaining_time": "0:54:42", "throughput": 5890.83, "total_tokens": 2784432} {"current_steps": 4275, "total_steps": 33920, "loss": 0.3881, "lr": 9.979418262163621e-06, "epoch": 2.52063679245283, "percentage": 12.6, "elapsed_time": "0:07:53", "remaining_time": "0:54:41", "throughput": 5890.34, "total_tokens": 2787088} {"current_steps": 4280, "total_steps": 33920, "loss": 0.4902, "lr": 9.979184410201652e-06, "epoch": 2.5235849056603774, "percentage": 12.62, "elapsed_time": "0:07:53", "remaining_time": "0:54:40", "throughput": 5890.63, "total_tokens": 2790000} {"current_steps": 4285, "total_steps": 33920, "loss": 0.4323, "lr": 9.97894923997915e-06, "epoch": 2.5265330188679247, "percentage": 12.63, "elapsed_time": "0:07:54", "remaining_time": "0:54:39", "throughput": 5890.0, "total_tokens": 2792688} {"current_steps": 4290, "total_steps": 33920, "loss": 0.5608, "lr": 9.97871275155838e-06, "epoch": 2.5294811320754715, "percentage": 12.65, "elapsed_time": "0:07:54", "remaining_time": "0:54:38", "throughput": 5890.86, "total_tokens": 2796400} {"current_steps": 4295, "total_steps": 33920, "loss": 0.5732, "lr": 9.978474945001949e-06, "epoch": 2.532429245283019, "percentage": 12.66, "elapsed_time": "0:07:55", "remaining_time": "0:54:37", "throughput": 5890.96, "total_tokens": 2799280} {"current_steps": 4300, "total_steps": 33920, "loss": 0.3648, "lr": 9.978235820372822e-06, "epoch": 2.535377358490566, "percentage": 12.68, "elapsed_time": "0:07:55", "remaining_time": "0:54:36", "throughput": 5891.59, "total_tokens": 2802672} {"current_steps": 4305, "total_steps": 33920, "loss": 0.5498, "lr": 9.977995377734307e-06, "epoch": 2.538325471698113, "percentage": 12.69, "elapsed_time": "0:07:56", "remaining_time": "0:54:35", "throughput": 5891.09, "total_tokens": 2805360} {"current_steps": 4310, "total_steps": 33920, "loss": 0.3648, "lr": 9.977753617150061e-06, "epoch": 2.5412735849056602, "percentage": 12.71, "elapsed_time": "0:07:56", "remaining_time": "0:54:35", "throughput": 5891.88, "total_tokens": 2809040} {"current_steps": 4315, "total_steps": 33920, "loss": 0.5923, "lr": 9.977510538684094e-06, "epoch": 2.5442216981132075, "percentage": 12.72, "elapsed_time": "0:07:57", "remaining_time": "0:54:34", "throughput": 5892.03, "total_tokens": 2812080} {"current_steps": 4320, "total_steps": 33920, "loss": 0.5526, "lr": 9.977266142400757e-06, "epoch": 2.547169811320755, "percentage": 12.74, "elapsed_time": "0:07:57", "remaining_time": "0:54:34", "throughput": 5892.66, "total_tokens": 2816400} {"current_steps": 4325, "total_steps": 33920, "loss": 0.5813, "lr": 9.977020428364759e-06, "epoch": 2.550117924528302, "percentage": 12.75, "elapsed_time": "0:07:58", "remaining_time": "0:54:34", "throughput": 5893.62, "total_tokens": 2820144} {"current_steps": 4330, "total_steps": 33920, "loss": 0.4183, "lr": 9.976773396641154e-06, "epoch": 2.553066037735849, "percentage": 12.77, "elapsed_time": "0:07:59", "remaining_time": "0:54:33", "throughput": 5893.9, "total_tokens": 2823184} {"current_steps": 4335, "total_steps": 33920, "loss": 0.3819, "lr": 9.976525047295342e-06, "epoch": 2.5560141509433962, "percentage": 12.78, "elapsed_time": "0:07:59", "remaining_time": "0:54:32", "throughput": 5893.77, "total_tokens": 2826320} {"current_steps": 4340, "total_steps": 33920, "loss": 0.4535, "lr": 9.976275380393077e-06, "epoch": 2.5589622641509435, "percentage": 12.79, "elapsed_time": "0:08:00", "remaining_time": "0:54:33", "throughput": 5894.76, "total_tokens": 2830928} {"current_steps": 4345, "total_steps": 33920, "loss": 0.5383, "lr": 9.976024396000459e-06, "epoch": 2.5619103773584904, "percentage": 12.81, "elapsed_time": "0:08:00", "remaining_time": "0:54:32", "throughput": 5894.99, "total_tokens": 2833968} {"current_steps": 4350, "total_steps": 33920, "loss": 0.5048, "lr": 9.975772094183935e-06, "epoch": 2.5648584905660377, "percentage": 12.82, "elapsed_time": "0:08:01", "remaining_time": "0:54:31", "throughput": 5895.43, "total_tokens": 2837392} {"current_steps": 4355, "total_steps": 33920, "loss": 0.5276, "lr": 9.975518475010306e-06, "epoch": 2.567806603773585, "percentage": 12.84, "elapsed_time": "0:08:01", "remaining_time": "0:54:30", "throughput": 5894.96, "total_tokens": 2840048} {"current_steps": 4360, "total_steps": 33920, "loss": 0.4091, "lr": 9.975263538546717e-06, "epoch": 2.5707547169811322, "percentage": 12.85, "elapsed_time": "0:08:02", "remaining_time": "0:54:29", "throughput": 5894.56, "total_tokens": 2842768} {"current_steps": 4365, "total_steps": 33920, "loss": 0.531, "lr": 9.975007284860664e-06, "epoch": 2.5737028301886795, "percentage": 12.87, "elapsed_time": "0:08:02", "remaining_time": "0:54:29", "throughput": 5895.33, "total_tokens": 2846512} {"current_steps": 4370, "total_steps": 33920, "loss": 0.6445, "lr": 9.974749714019993e-06, "epoch": 2.5766509433962264, "percentage": 12.88, "elapsed_time": "0:08:03", "remaining_time": "0:54:28", "throughput": 5895.48, "total_tokens": 2849808} {"current_steps": 4375, "total_steps": 33920, "loss": 0.4806, "lr": 9.974490826092894e-06, "epoch": 2.5795990566037736, "percentage": 12.9, "elapsed_time": "0:08:03", "remaining_time": "0:54:28", "throughput": 5895.8, "total_tokens": 2853360} {"current_steps": 4380, "total_steps": 33920, "loss": 0.4182, "lr": 9.974230621147907e-06, "epoch": 2.5825471698113205, "percentage": 12.91, "elapsed_time": "0:08:04", "remaining_time": "0:54:28", "throughput": 5896.38, "total_tokens": 2857296} {"current_steps": 4385, "total_steps": 33920, "loss": 0.5549, "lr": 9.973969099253928e-06, "epoch": 2.5854952830188678, "percentage": 12.93, "elapsed_time": "0:08:05", "remaining_time": "0:54:27", "throughput": 5897.44, "total_tokens": 2861136} {"current_steps": 4390, "total_steps": 33920, "loss": 0.4759, "lr": 9.973706260480194e-06, "epoch": 2.588443396226415, "percentage": 12.94, "elapsed_time": "0:08:05", "remaining_time": "0:54:26", "throughput": 5897.26, "total_tokens": 2863888} {"current_steps": 4395, "total_steps": 33920, "loss": 0.5552, "lr": 9.97344210489629e-06, "epoch": 2.5913915094339623, "percentage": 12.96, "elapsed_time": "0:08:06", "remaining_time": "0:54:26", "throughput": 5897.73, "total_tokens": 2867504} {"current_steps": 4400, "total_steps": 33920, "loss": 0.47, "lr": 9.973176632572158e-06, "epoch": 2.5943396226415096, "percentage": 12.97, "elapsed_time": "0:08:06", "remaining_time": "0:54:26", "throughput": 5897.36, "total_tokens": 2871056} {"current_steps": 4405, "total_steps": 33920, "loss": 0.5567, "lr": 9.972909843578076e-06, "epoch": 2.5972877358490565, "percentage": 12.99, "elapsed_time": "0:08:07", "remaining_time": "0:54:25", "throughput": 5896.3, "total_tokens": 2873712} {"current_steps": 4410, "total_steps": 33920, "loss": 0.6168, "lr": 9.972641737984681e-06, "epoch": 2.6002358490566038, "percentage": 13.0, "elapsed_time": "0:08:07", "remaining_time": "0:54:24", "throughput": 5896.07, "total_tokens": 2876720} {"current_steps": 4415, "total_steps": 33920, "loss": 0.478, "lr": 9.972372315862956e-06, "epoch": 2.603183962264151, "percentage": 13.02, "elapsed_time": "0:08:08", "remaining_time": "0:54:24", "throughput": 5895.51, "total_tokens": 2879664} {"current_steps": 4420, "total_steps": 33920, "loss": 0.4594, "lr": 9.97210157728423e-06, "epoch": 2.606132075471698, "percentage": 13.03, "elapsed_time": "0:08:08", "remaining_time": "0:54:23", "throughput": 5895.43, "total_tokens": 2882704} {"current_steps": 4425, "total_steps": 33920, "loss": 0.3238, "lr": 9.971829522320185e-06, "epoch": 2.609080188679245, "percentage": 13.05, "elapsed_time": "0:08:10", "remaining_time": "0:54:26", "throughput": 5897.67, "total_tokens": 2890448} {"current_steps": 4430, "total_steps": 33920, "loss": 0.4571, "lr": 9.971556151042843e-06, "epoch": 2.6120283018867925, "percentage": 13.06, "elapsed_time": "0:08:10", "remaining_time": "0:54:25", "throughput": 5897.59, "total_tokens": 2893424} {"current_steps": 4435, "total_steps": 33920, "loss": 0.5833, "lr": 9.971281463524588e-06, "epoch": 2.6149764150943398, "percentage": 13.07, "elapsed_time": "0:08:11", "remaining_time": "0:54:27", "throughput": 5899.08, "total_tokens": 2899600} {"current_steps": 4440, "total_steps": 33920, "loss": 0.4556, "lr": 9.971005459838136e-06, "epoch": 2.617924528301887, "percentage": 13.09, "elapsed_time": "0:08:12", "remaining_time": "0:54:27", "throughput": 5899.93, "total_tokens": 2903600} {"current_steps": 4445, "total_steps": 33920, "loss": 0.5396, "lr": 9.970728140056567e-06, "epoch": 2.620872641509434, "percentage": 13.1, "elapsed_time": "0:08:12", "remaining_time": "0:54:26", "throughput": 5900.54, "total_tokens": 2907088} {"current_steps": 4450, "total_steps": 33920, "loss": 0.4049, "lr": 9.9704495042533e-06, "epoch": 2.623820754716981, "percentage": 13.12, "elapsed_time": "0:08:13", "remaining_time": "0:54:26", "throughput": 5900.57, "total_tokens": 2910672} {"current_steps": 4455, "total_steps": 33920, "loss": 0.5402, "lr": 9.970169552502105e-06, "epoch": 2.6267688679245285, "percentage": 13.13, "elapsed_time": "0:08:13", "remaining_time": "0:54:25", "throughput": 5899.72, "total_tokens": 2913008} {"current_steps": 4460, "total_steps": 33920, "loss": 0.5486, "lr": 9.969888284877102e-06, "epoch": 2.6297169811320753, "percentage": 13.15, "elapsed_time": "0:08:14", "remaining_time": "0:54:25", "throughput": 5899.81, "total_tokens": 2916240} {"current_steps": 4465, "total_steps": 33920, "loss": 0.3449, "lr": 9.969605701452757e-06, "epoch": 2.6326650943396226, "percentage": 13.16, "elapsed_time": "0:08:14", "remaining_time": "0:54:24", "throughput": 5900.0, "total_tokens": 2919408} {"current_steps": 4470, "total_steps": 33920, "loss": 0.4772, "lr": 9.969321802303882e-06, "epoch": 2.63561320754717, "percentage": 13.18, "elapsed_time": "0:08:15", "remaining_time": "0:54:23", "throughput": 5899.56, "total_tokens": 2922224} {"current_steps": 4475, "total_steps": 33920, "loss": 0.4397, "lr": 9.969036587505644e-06, "epoch": 2.638561320754717, "percentage": 13.19, "elapsed_time": "0:08:15", "remaining_time": "0:54:22", "throughput": 5899.89, "total_tokens": 2925616} {"current_steps": 4480, "total_steps": 33920, "loss": 0.3676, "lr": 9.968750057133555e-06, "epoch": 2.641509433962264, "percentage": 13.21, "elapsed_time": "0:08:16", "remaining_time": "0:54:21", "throughput": 5899.69, "total_tokens": 2928304} {"current_steps": 4485, "total_steps": 33920, "loss": 0.5841, "lr": 9.968462211263474e-06, "epoch": 2.6444575471698113, "percentage": 13.22, "elapsed_time": "0:08:16", "remaining_time": "0:54:20", "throughput": 5899.77, "total_tokens": 2931440} {"current_steps": 4490, "total_steps": 33920, "loss": 0.3536, "lr": 9.96817304997161e-06, "epoch": 2.6474056603773586, "percentage": 13.24, "elapsed_time": "0:08:17", "remaining_time": "0:54:20", "throughput": 5899.45, "total_tokens": 2934416} {"current_steps": 4495, "total_steps": 33920, "loss": 0.5362, "lr": 9.967882573334519e-06, "epoch": 2.6503537735849054, "percentage": 13.25, "elapsed_time": "0:08:17", "remaining_time": "0:54:19", "throughput": 5898.32, "total_tokens": 2936912} {"current_steps": 4500, "total_steps": 33920, "loss": 0.4731, "lr": 9.967590781429106e-06, "epoch": 2.6533018867924527, "percentage": 13.27, "elapsed_time": "0:08:18", "remaining_time": "0:54:19", "throughput": 5899.28, "total_tokens": 2940912} {"current_steps": 4505, "total_steps": 33920, "loss": 0.5464, "lr": 9.967297674332625e-06, "epoch": 2.65625, "percentage": 13.28, "elapsed_time": "0:08:19", "remaining_time": "0:54:18", "throughput": 5899.48, "total_tokens": 2944336} {"current_steps": 4510, "total_steps": 33920, "loss": 0.4632, "lr": 9.967003252122675e-06, "epoch": 2.6591981132075473, "percentage": 13.3, "elapsed_time": "0:08:19", "remaining_time": "0:54:18", "throughput": 5900.32, "total_tokens": 2948208} {"current_steps": 4515, "total_steps": 33920, "loss": 0.5545, "lr": 9.96670751487721e-06, "epoch": 2.6621462264150946, "percentage": 13.31, "elapsed_time": "0:08:20", "remaining_time": "0:54:17", "throughput": 5900.46, "total_tokens": 2951088} {"current_steps": 4520, "total_steps": 33920, "loss": 0.4656, "lr": 9.966410462674525e-06, "epoch": 2.6650943396226414, "percentage": 13.33, "elapsed_time": "0:08:20", "remaining_time": "0:54:16", "throughput": 5900.42, "total_tokens": 2954000} {"current_steps": 4525, "total_steps": 33920, "loss": 0.4189, "lr": 9.966112095593264e-06, "epoch": 2.6680424528301887, "percentage": 13.34, "elapsed_time": "0:08:21", "remaining_time": "0:54:15", "throughput": 5899.87, "total_tokens": 2956624} {"current_steps": 4530, "total_steps": 33920, "loss": 0.5658, "lr": 9.965812413712425e-06, "epoch": 2.670990566037736, "percentage": 13.35, "elapsed_time": "0:08:21", "remaining_time": "0:54:14", "throughput": 5900.07, "total_tokens": 2959568} {"current_steps": 4535, "total_steps": 33920, "loss": 0.5916, "lr": 9.965511417111346e-06, "epoch": 2.673938679245283, "percentage": 13.37, "elapsed_time": "0:08:22", "remaining_time": "0:54:13", "throughput": 5900.25, "total_tokens": 2962928} {"current_steps": 4540, "total_steps": 33920, "loss": 0.509, "lr": 9.96520910586972e-06, "epoch": 2.67688679245283, "percentage": 13.38, "elapsed_time": "0:08:22", "remaining_time": "0:54:13", "throughput": 5900.78, "total_tokens": 2966352} {"current_steps": 4545, "total_steps": 33920, "loss": 0.3752, "lr": 9.964905480067585e-06, "epoch": 2.6798349056603774, "percentage": 13.4, "elapsed_time": "0:08:23", "remaining_time": "0:54:12", "throughput": 5900.96, "total_tokens": 2969584} {"current_steps": 4550, "total_steps": 33920, "loss": 0.3916, "lr": 9.964600539785328e-06, "epoch": 2.6827830188679247, "percentage": 13.41, "elapsed_time": "0:08:23", "remaining_time": "0:54:11", "throughput": 5900.25, "total_tokens": 2972016} {"current_steps": 4555, "total_steps": 33920, "loss": 0.6724, "lr": 9.96429428510368e-06, "epoch": 2.6857311320754715, "percentage": 13.43, "elapsed_time": "0:08:24", "remaining_time": "0:54:10", "throughput": 5900.16, "total_tokens": 2974800} {"current_steps": 4560, "total_steps": 33920, "loss": 0.4719, "lr": 9.963986716103724e-06, "epoch": 2.688679245283019, "percentage": 13.44, "elapsed_time": "0:08:24", "remaining_time": "0:54:09", "throughput": 5898.75, "total_tokens": 2977136} {"current_steps": 4565, "total_steps": 33920, "loss": 0.4485, "lr": 9.963677832866893e-06, "epoch": 2.691627358490566, "percentage": 13.46, "elapsed_time": "0:08:25", "remaining_time": "0:54:08", "throughput": 5898.44, "total_tokens": 2979888} {"current_steps": 4570, "total_steps": 33920, "loss": 0.572, "lr": 9.963367635474962e-06, "epoch": 2.694575471698113, "percentage": 13.47, "elapsed_time": "0:08:25", "remaining_time": "0:54:07", "throughput": 5898.86, "total_tokens": 2983248} {"current_steps": 4575, "total_steps": 33920, "loss": 0.5488, "lr": 9.96305612401006e-06, "epoch": 2.6975235849056602, "percentage": 13.49, "elapsed_time": "0:08:26", "remaining_time": "0:54:07", "throughput": 5898.73, "total_tokens": 2986320} {"current_steps": 4580, "total_steps": 33920, "loss": 0.6084, "lr": 9.96274329855466e-06, "epoch": 2.7004716981132075, "percentage": 13.5, "elapsed_time": "0:08:26", "remaining_time": "0:54:06", "throughput": 5898.87, "total_tokens": 2989392} {"current_steps": 4585, "total_steps": 33920, "loss": 0.5299, "lr": 9.962429159191583e-06, "epoch": 2.703419811320755, "percentage": 13.52, "elapsed_time": "0:08:27", "remaining_time": "0:54:05", "throughput": 5898.47, "total_tokens": 2992400} {"current_steps": 4590, "total_steps": 33920, "loss": 0.4753, "lr": 9.962113706003997e-06, "epoch": 2.706367924528302, "percentage": 13.53, "elapsed_time": "0:08:27", "remaining_time": "0:54:04", "throughput": 5897.96, "total_tokens": 2995056} {"current_steps": 4595, "total_steps": 33920, "loss": 0.5708, "lr": 9.961796939075424e-06, "epoch": 2.709316037735849, "percentage": 13.55, "elapsed_time": "0:08:28", "remaining_time": "0:54:04", "throughput": 5898.33, "total_tokens": 2998352} {"current_steps": 4600, "total_steps": 33920, "loss": 0.4354, "lr": 9.961478858489728e-06, "epoch": 2.7122641509433962, "percentage": 13.56, "elapsed_time": "0:08:28", "remaining_time": "0:54:04", "throughput": 5898.91, "total_tokens": 3002256} {"current_steps": 4605, "total_steps": 33920, "loss": 0.5572, "lr": 9.961159464331119e-06, "epoch": 2.7152122641509435, "percentage": 13.58, "elapsed_time": "0:08:29", "remaining_time": "0:54:02", "throughput": 5898.77, "total_tokens": 3005008} {"current_steps": 4610, "total_steps": 33920, "loss": 0.4895, "lr": 9.960838756684161e-06, "epoch": 2.7181603773584904, "percentage": 13.59, "elapsed_time": "0:08:29", "remaining_time": "0:54:02", "throughput": 5899.16, "total_tokens": 3008272} {"current_steps": 4615, "total_steps": 33920, "loss": 0.5084, "lr": 9.960516735633764e-06, "epoch": 2.7211084905660377, "percentage": 13.61, "elapsed_time": "0:08:30", "remaining_time": "0:54:01", "throughput": 5898.96, "total_tokens": 3010864} {"current_steps": 4620, "total_steps": 33920, "loss": 0.5067, "lr": 9.960193401265181e-06, "epoch": 2.724056603773585, "percentage": 13.62, "elapsed_time": "0:08:30", "remaining_time": "0:54:00", "throughput": 5898.67, "total_tokens": 3013872} {"current_steps": 4625, "total_steps": 33920, "loss": 0.6774, "lr": 9.959868753664018e-06, "epoch": 2.7270047169811322, "percentage": 13.64, "elapsed_time": "0:08:31", "remaining_time": "0:53:59", "throughput": 5898.84, "total_tokens": 3016912} {"current_steps": 4630, "total_steps": 33920, "loss": 0.5242, "lr": 9.959542792916227e-06, "epoch": 2.7299528301886795, "percentage": 13.65, "elapsed_time": "0:08:31", "remaining_time": "0:53:58", "throughput": 5899.23, "total_tokens": 3020272} {"current_steps": 4635, "total_steps": 33920, "loss": 0.3996, "lr": 9.959215519108108e-06, "epoch": 2.7329009433962264, "percentage": 13.66, "elapsed_time": "0:08:32", "remaining_time": "0:53:58", "throughput": 5899.95, "total_tokens": 3024208} {"current_steps": 4640, "total_steps": 33920, "loss": 0.5381, "lr": 9.958886932326306e-06, "epoch": 2.7358490566037736, "percentage": 13.68, "elapsed_time": "0:08:33", "remaining_time": "0:53:57", "throughput": 5899.63, "total_tokens": 3026960} {"current_steps": 4645, "total_steps": 33920, "loss": 0.6327, "lr": 9.958557032657817e-06, "epoch": 2.7387971698113205, "percentage": 13.69, "elapsed_time": "0:08:33", "remaining_time": "0:53:56", "throughput": 5898.6, "total_tokens": 3029424} {"current_steps": 4650, "total_steps": 33920, "loss": 0.5178, "lr": 9.958225820189984e-06, "epoch": 2.7417452830188678, "percentage": 13.71, "elapsed_time": "0:08:34", "remaining_time": "0:53:56", "throughput": 5899.66, "total_tokens": 3033424} {"current_steps": 4655, "total_steps": 33920, "loss": 0.4539, "lr": 9.957893295010495e-06, "epoch": 2.744693396226415, "percentage": 13.72, "elapsed_time": "0:08:34", "remaining_time": "0:53:55", "throughput": 5899.67, "total_tokens": 3036112} {"current_steps": 4660, "total_steps": 33920, "loss": 0.4823, "lr": 9.957559457207391e-06, "epoch": 2.7476415094339623, "percentage": 13.74, "elapsed_time": "0:08:35", "remaining_time": "0:53:56", "throughput": 5900.76, "total_tokens": 3041872} {"current_steps": 4665, "total_steps": 33920, "loss": 0.5121, "lr": 9.957224306869053e-06, "epoch": 2.7505896226415096, "percentage": 13.75, "elapsed_time": "0:08:35", "remaining_time": "0:53:55", "throughput": 5900.72, "total_tokens": 3044720} {"current_steps": 4670, "total_steps": 33920, "loss": 0.4737, "lr": 9.956887844084216e-06, "epoch": 2.7535377358490565, "percentage": 13.77, "elapsed_time": "0:08:36", "remaining_time": "0:53:54", "throughput": 5900.53, "total_tokens": 3047440} {"current_steps": 4675, "total_steps": 33920, "loss": 0.4098, "lr": 9.956550068941958e-06, "epoch": 2.7564858490566038, "percentage": 13.78, "elapsed_time": "0:08:36", "remaining_time": "0:53:53", "throughput": 5900.36, "total_tokens": 3050256} {"current_steps": 4680, "total_steps": 33920, "loss": 0.4572, "lr": 9.95621098153171e-06, "epoch": 2.759433962264151, "percentage": 13.8, "elapsed_time": "0:08:37", "remaining_time": "0:53:53", "throughput": 5900.93, "total_tokens": 3053552} {"current_steps": 4685, "total_steps": 33920, "loss": 0.4695, "lr": 9.955870581943243e-06, "epoch": 2.762382075471698, "percentage": 13.81, "elapsed_time": "0:08:37", "remaining_time": "0:53:52", "throughput": 5900.23, "total_tokens": 3056304} {"current_steps": 4690, "total_steps": 33920, "loss": 0.5201, "lr": 9.955528870266681e-06, "epoch": 2.765330188679245, "percentage": 13.83, "elapsed_time": "0:08:38", "remaining_time": "0:53:51", "throughput": 5899.64, "total_tokens": 3058960} {"current_steps": 4695, "total_steps": 33920, "loss": 0.324, "lr": 9.955185846592495e-06, "epoch": 2.7682783018867925, "percentage": 13.84, "elapsed_time": "0:08:38", "remaining_time": "0:53:50", "throughput": 5899.41, "total_tokens": 3061616} {"current_steps": 4700, "total_steps": 33920, "loss": 0.3864, "lr": 9.9548415110115e-06, "epoch": 2.7712264150943398, "percentage": 13.86, "elapsed_time": "0:08:39", "remaining_time": "0:53:49", "throughput": 5899.49, "total_tokens": 3064880} {"current_steps": 4705, "total_steps": 33920, "loss": 0.4798, "lr": 9.95449586361486e-06, "epoch": 2.774174528301887, "percentage": 13.87, "elapsed_time": "0:08:39", "remaining_time": "0:53:48", "throughput": 5899.38, "total_tokens": 3067664} {"current_steps": 4710, "total_steps": 33920, "loss": 0.5824, "lr": 9.954148904494085e-06, "epoch": 2.777122641509434, "percentage": 13.89, "elapsed_time": "0:08:40", "remaining_time": "0:53:47", "throughput": 5898.65, "total_tokens": 3070064} {"current_steps": 4715, "total_steps": 33920, "loss": 0.5195, "lr": 9.95380063374104e-06, "epoch": 2.780070754716981, "percentage": 13.9, "elapsed_time": "0:08:40", "remaining_time": "0:53:47", "throughput": 5898.09, "total_tokens": 3072848} {"current_steps": 4720, "total_steps": 33920, "loss": 0.5824, "lr": 9.953451051447927e-06, "epoch": 2.7830188679245285, "percentage": 13.92, "elapsed_time": "0:08:41", "remaining_time": "0:53:47", "throughput": 5898.94, "total_tokens": 3077168} {"current_steps": 4725, "total_steps": 33920, "loss": 0.5513, "lr": 9.953100157707299e-06, "epoch": 2.7859669811320753, "percentage": 13.93, "elapsed_time": "0:08:42", "remaining_time": "0:53:46", "throughput": 5899.19, "total_tokens": 3080496} {"current_steps": 4730, "total_steps": 33920, "loss": 0.6045, "lr": 9.952747952612056e-06, "epoch": 2.7889150943396226, "percentage": 13.94, "elapsed_time": "0:08:42", "remaining_time": "0:53:45", "throughput": 5897.29, "total_tokens": 3082608} {"current_steps": 4735, "total_steps": 33920, "loss": 0.6115, "lr": 9.952394436255451e-06, "epoch": 2.79186320754717, "percentage": 13.96, "elapsed_time": "0:08:43", "remaining_time": "0:53:45", "throughput": 5897.83, "total_tokens": 3086128} {"current_steps": 4740, "total_steps": 33920, "loss": 0.5221, "lr": 9.952039608731072e-06, "epoch": 2.794811320754717, "percentage": 13.97, "elapsed_time": "0:08:43", "remaining_time": "0:53:44", "throughput": 5898.35, "total_tokens": 3089424} {"current_steps": 4745, "total_steps": 33920, "loss": 0.4511, "lr": 9.951683470132868e-06, "epoch": 2.797759433962264, "percentage": 13.99, "elapsed_time": "0:08:44", "remaining_time": "0:53:43", "throughput": 5898.38, "total_tokens": 3092528} {"current_steps": 4750, "total_steps": 33920, "loss": 0.5285, "lr": 9.951326020555122e-06, "epoch": 2.8007075471698113, "percentage": 14.0, "elapsed_time": "0:08:44", "remaining_time": "0:53:42", "throughput": 5898.64, "total_tokens": 3095696} {"current_steps": 4755, "total_steps": 33920, "loss": 0.5104, "lr": 9.950967260092473e-06, "epoch": 2.8036556603773586, "percentage": 14.02, "elapsed_time": "0:08:45", "remaining_time": "0:53:42", "throughput": 5898.56, "total_tokens": 3098928} {"current_steps": 4760, "total_steps": 33920, "loss": 0.538, "lr": 9.950607188839905e-06, "epoch": 2.8066037735849054, "percentage": 14.03, "elapsed_time": "0:08:45", "remaining_time": "0:53:42", "throughput": 5899.61, "total_tokens": 3103024} {"current_steps": 4765, "total_steps": 33920, "loss": 0.4575, "lr": 9.950245806892749e-06, "epoch": 2.8095518867924527, "percentage": 14.05, "elapsed_time": "0:08:46", "remaining_time": "0:53:41", "throughput": 5900.1, "total_tokens": 3106480} {"current_steps": 4770, "total_steps": 33920, "loss": 0.4051, "lr": 9.94988311434668e-06, "epoch": 2.8125, "percentage": 14.06, "elapsed_time": "0:08:47", "remaining_time": "0:53:40", "throughput": 5900.29, "total_tokens": 3109840} {"current_steps": 4775, "total_steps": 33920, "loss": 0.4717, "lr": 9.949519111297723e-06, "epoch": 2.8154481132075473, "percentage": 14.08, "elapsed_time": "0:08:47", "remaining_time": "0:53:40", "throughput": 5900.74, "total_tokens": 3113072} {"current_steps": 4780, "total_steps": 33920, "loss": 0.4592, "lr": 9.949153797842252e-06, "epoch": 2.8183962264150946, "percentage": 14.09, "elapsed_time": "0:08:48", "remaining_time": "0:53:39", "throughput": 5900.58, "total_tokens": 3116304} {"current_steps": 4785, "total_steps": 33920, "loss": 0.4717, "lr": 9.948787174076982e-06, "epoch": 2.8213443396226414, "percentage": 14.11, "elapsed_time": "0:08:48", "remaining_time": "0:53:38", "throughput": 5900.4, "total_tokens": 3119152} {"current_steps": 4790, "total_steps": 33920, "loss": 0.4545, "lr": 9.948419240098978e-06, "epoch": 2.8242924528301887, "percentage": 14.12, "elapsed_time": "0:08:49", "remaining_time": "0:53:37", "throughput": 5900.57, "total_tokens": 3122160} {"current_steps": 4795, "total_steps": 33920, "loss": 0.3353, "lr": 9.948049996005657e-06, "epoch": 2.827240566037736, "percentage": 14.14, "elapsed_time": "0:08:49", "remaining_time": "0:53:36", "throughput": 5901.0, "total_tokens": 3125296} {"current_steps": 4800, "total_steps": 33920, "loss": 0.4559, "lr": 9.947679441894773e-06, "epoch": 2.830188679245283, "percentage": 14.15, "elapsed_time": "0:08:50", "remaining_time": "0:53:36", "throughput": 5901.42, "total_tokens": 3128496} {"current_steps": 4805, "total_steps": 33920, "loss": 0.5985, "lr": 9.947307577864433e-06, "epoch": 2.83313679245283, "percentage": 14.17, "elapsed_time": "0:08:50", "remaining_time": "0:53:35", "throughput": 5902.15, "total_tokens": 3132272} {"current_steps": 4810, "total_steps": 33920, "loss": 0.5325, "lr": 9.94693440401309e-06, "epoch": 2.8360849056603774, "percentage": 14.18, "elapsed_time": "0:08:51", "remaining_time": "0:53:34", "throughput": 5902.31, "total_tokens": 3135280} {"current_steps": 4815, "total_steps": 33920, "loss": 0.4734, "lr": 9.946559920439545e-06, "epoch": 2.8390330188679247, "percentage": 14.2, "elapsed_time": "0:08:51", "remaining_time": "0:53:33", "throughput": 5902.57, "total_tokens": 3138352} {"current_steps": 4820, "total_steps": 33920, "loss": 0.4258, "lr": 9.946184127242942e-06, "epoch": 2.8419811320754715, "percentage": 14.21, "elapsed_time": "0:08:52", "remaining_time": "0:53:33", "throughput": 5902.97, "total_tokens": 3141520} {"current_steps": 4825, "total_steps": 33920, "loss": 0.3801, "lr": 9.945807024522774e-06, "epoch": 2.844929245283019, "percentage": 14.22, "elapsed_time": "0:08:52", "remaining_time": "0:53:31", "throughput": 5902.56, "total_tokens": 3143952} {"current_steps": 4830, "total_steps": 33920, "loss": 0.5233, "lr": 9.945428612378881e-06, "epoch": 2.847877358490566, "percentage": 14.24, "elapsed_time": "0:08:53", "remaining_time": "0:53:30", "throughput": 5902.26, "total_tokens": 3146736} {"current_steps": 4835, "total_steps": 33920, "loss": 0.6951, "lr": 9.94504889091145e-06, "epoch": 2.850825471698113, "percentage": 14.25, "elapsed_time": "0:08:53", "remaining_time": "0:53:29", "throughput": 5901.61, "total_tokens": 3148944} {"current_steps": 4840, "total_steps": 33920, "loss": 0.4822, "lr": 9.944667860221013e-06, "epoch": 2.8537735849056602, "percentage": 14.27, "elapsed_time": "0:08:54", "remaining_time": "0:53:29", "throughput": 5902.19, "total_tokens": 3152432} {"current_steps": 4845, "total_steps": 33920, "loss": 0.4719, "lr": 9.944285520408448e-06, "epoch": 2.8567216981132075, "percentage": 14.28, "elapsed_time": "0:08:54", "remaining_time": "0:53:29", "throughput": 5902.96, "total_tokens": 3156688} {"current_steps": 4850, "total_steps": 33920, "loss": 0.4947, "lr": 9.943901871574984e-06, "epoch": 2.859669811320755, "percentage": 14.3, "elapsed_time": "0:08:55", "remaining_time": "0:53:28", "throughput": 5902.91, "total_tokens": 3159408} {"current_steps": 4855, "total_steps": 33920, "loss": 0.5738, "lr": 9.943516913822192e-06, "epoch": 2.862617924528302, "percentage": 14.31, "elapsed_time": "0:08:55", "remaining_time": "0:53:27", "throughput": 5903.65, "total_tokens": 3163248} {"current_steps": 4860, "total_steps": 33920, "loss": 0.4385, "lr": 9.943130647251994e-06, "epoch": 2.865566037735849, "percentage": 14.33, "elapsed_time": "0:08:56", "remaining_time": "0:53:26", "throughput": 5903.11, "total_tokens": 3165584} {"current_steps": 4865, "total_steps": 33920, "loss": 0.3143, "lr": 9.94274307196665e-06, "epoch": 2.8685141509433962, "percentage": 14.34, "elapsed_time": "0:08:56", "remaining_time": "0:53:25", "throughput": 5903.37, "total_tokens": 3168656} {"current_steps": 4870, "total_steps": 33920, "loss": 0.363, "lr": 9.942354188068778e-06, "epoch": 2.8714622641509435, "percentage": 14.36, "elapsed_time": "0:08:57", "remaining_time": "0:53:24", "throughput": 5903.95, "total_tokens": 3172048} {"current_steps": 4875, "total_steps": 33920, "loss": 0.6071, "lr": 9.941963995661333e-06, "epoch": 2.8744103773584904, "percentage": 14.37, "elapsed_time": "0:08:57", "remaining_time": "0:53:23", "throughput": 5904.05, "total_tokens": 3174896} {"current_steps": 4880, "total_steps": 33920, "loss": 0.5665, "lr": 9.941572494847622e-06, "epoch": 2.8773584905660377, "percentage": 14.39, "elapsed_time": "0:08:58", "remaining_time": "0:53:22", "throughput": 5903.5, "total_tokens": 3177488} {"current_steps": 4885, "total_steps": 33920, "loss": 0.454, "lr": 9.941179685731297e-06, "epoch": 2.880306603773585, "percentage": 14.4, "elapsed_time": "0:08:58", "remaining_time": "0:53:21", "throughput": 5902.38, "total_tokens": 3179440} {"current_steps": 4890, "total_steps": 33920, "loss": 0.4224, "lr": 9.940785568416354e-06, "epoch": 2.8832547169811322, "percentage": 14.42, "elapsed_time": "0:08:59", "remaining_time": "0:53:21", "throughput": 5902.74, "total_tokens": 3182896} {"current_steps": 4895, "total_steps": 33920, "loss": 0.4948, "lr": 9.940390143007137e-06, "epoch": 2.8862028301886795, "percentage": 14.43, "elapsed_time": "0:08:59", "remaining_time": "0:53:20", "throughput": 5903.18, "total_tokens": 3186320} {"current_steps": 4900, "total_steps": 33920, "loss": 0.5518, "lr": 9.939993409608339e-06, "epoch": 2.8891509433962264, "percentage": 14.45, "elapsed_time": "0:09:00", "remaining_time": "0:53:19", "throughput": 5903.41, "total_tokens": 3189200} {"current_steps": 4905, "total_steps": 33920, "loss": 0.474, "lr": 9.939595368324996e-06, "epoch": 2.8920990566037736, "percentage": 14.46, "elapsed_time": "0:09:00", "remaining_time": "0:53:19", "throughput": 5904.25, "total_tokens": 3193104} {"current_steps": 4910, "total_steps": 33920, "loss": 0.3859, "lr": 9.93919601926249e-06, "epoch": 2.8950471698113205, "percentage": 14.48, "elapsed_time": "0:09:01", "remaining_time": "0:53:18", "throughput": 5904.3, "total_tokens": 3195920} {"current_steps": 4915, "total_steps": 33920, "loss": 0.4464, "lr": 9.938795362526552e-06, "epoch": 2.8979952830188678, "percentage": 14.49, "elapsed_time": "0:09:02", "remaining_time": "0:53:18", "throughput": 5905.4, "total_tokens": 3200848} {"current_steps": 4920, "total_steps": 33920, "loss": 0.474, "lr": 9.938393398223255e-06, "epoch": 2.900943396226415, "percentage": 14.5, "elapsed_time": "0:09:02", "remaining_time": "0:53:17", "throughput": 5905.73, "total_tokens": 3203984} {"current_steps": 4925, "total_steps": 33920, "loss": 0.4361, "lr": 9.937990126459024e-06, "epoch": 2.9038915094339623, "percentage": 14.52, "elapsed_time": "0:09:03", "remaining_time": "0:53:17", "throughput": 5906.29, "total_tokens": 3207824} {"current_steps": 4930, "total_steps": 33920, "loss": 0.5225, "lr": 9.937585547340624e-06, "epoch": 2.9068396226415096, "percentage": 14.53, "elapsed_time": "0:09:03", "remaining_time": "0:53:16", "throughput": 5906.61, "total_tokens": 3210992} {"current_steps": 4935, "total_steps": 33920, "loss": 0.3623, "lr": 9.937179660975174e-06, "epoch": 2.9097877358490565, "percentage": 14.55, "elapsed_time": "0:09:04", "remaining_time": "0:53:16", "throughput": 5907.17, "total_tokens": 3214544} {"current_steps": 4940, "total_steps": 33920, "loss": 0.4696, "lr": 9.936772467470127e-06, "epoch": 2.9127358490566038, "percentage": 14.56, "elapsed_time": "0:09:04", "remaining_time": "0:53:15", "throughput": 5907.14, "total_tokens": 3217424} {"current_steps": 4945, "total_steps": 33920, "loss": 0.6843, "lr": 9.936363966933294e-06, "epoch": 2.915683962264151, "percentage": 14.58, "elapsed_time": "0:09:05", "remaining_time": "0:53:14", "throughput": 5907.39, "total_tokens": 3220400} {"current_steps": 4950, "total_steps": 33920, "loss": 0.375, "lr": 9.935954159472828e-06, "epoch": 2.918632075471698, "percentage": 14.59, "elapsed_time": "0:09:05", "remaining_time": "0:53:13", "throughput": 5907.75, "total_tokens": 3223408} {"current_steps": 4955, "total_steps": 33920, "loss": 0.418, "lr": 9.935543045197222e-06, "epoch": 2.921580188679245, "percentage": 14.61, "elapsed_time": "0:09:06", "remaining_time": "0:53:12", "throughput": 5907.67, "total_tokens": 3226288} {"current_steps": 4960, "total_steps": 33920, "loss": 0.5549, "lr": 9.935130624215326e-06, "epoch": 2.9245283018867925, "percentage": 14.62, "elapsed_time": "0:09:06", "remaining_time": "0:53:11", "throughput": 5907.8, "total_tokens": 3229296} {"current_steps": 4965, "total_steps": 33920, "loss": 0.5579, "lr": 9.934716896636329e-06, "epoch": 2.9274764150943398, "percentage": 14.64, "elapsed_time": "0:09:07", "remaining_time": "0:53:10", "throughput": 5907.77, "total_tokens": 3232048} {"current_steps": 4970, "total_steps": 33920, "loss": 0.6727, "lr": 9.934301862569764e-06, "epoch": 2.930424528301887, "percentage": 14.65, "elapsed_time": "0:09:07", "remaining_time": "0:53:09", "throughput": 5907.67, "total_tokens": 3234832} {"current_steps": 4975, "total_steps": 33920, "loss": 0.6517, "lr": 9.933885522125517e-06, "epoch": 2.933372641509434, "percentage": 14.67, "elapsed_time": "0:09:08", "remaining_time": "0:53:08", "throughput": 5907.53, "total_tokens": 3237648} {"current_steps": 4980, "total_steps": 33920, "loss": 0.6168, "lr": 9.933467875413813e-06, "epoch": 2.936320754716981, "percentage": 14.68, "elapsed_time": "0:09:08", "remaining_time": "0:53:07", "throughput": 5908.12, "total_tokens": 3240944} {"current_steps": 4985, "total_steps": 33920, "loss": 0.5366, "lr": 9.933048922545227e-06, "epoch": 2.9392688679245285, "percentage": 14.7, "elapsed_time": "0:09:09", "remaining_time": "0:53:06", "throughput": 5908.42, "total_tokens": 3244016} {"current_steps": 4990, "total_steps": 33920, "loss": 0.4305, "lr": 9.932628663630679e-06, "epoch": 2.9422169811320753, "percentage": 14.71, "elapsed_time": "0:09:09", "remaining_time": "0:53:05", "throughput": 5907.88, "total_tokens": 3246576} {"current_steps": 4995, "total_steps": 33920, "loss": 0.6666, "lr": 9.932207098781432e-06, "epoch": 2.9451650943396226, "percentage": 14.73, "elapsed_time": "0:09:10", "remaining_time": "0:53:05", "throughput": 5908.49, "total_tokens": 3250160} {"current_steps": 5000, "total_steps": 33920, "loss": 0.5147, "lr": 9.931784228109102e-06, "epoch": 2.94811320754717, "percentage": 14.74, "elapsed_time": "0:09:10", "remaining_time": "0:53:04", "throughput": 5908.84, "total_tokens": 3253296} {"current_steps": 5005, "total_steps": 33920, "loss": 0.459, "lr": 9.93136005172564e-06, "epoch": 2.951061320754717, "percentage": 14.76, "elapsed_time": "0:09:11", "remaining_time": "0:53:03", "throughput": 5908.8, "total_tokens": 3256496} {"current_steps": 5010, "total_steps": 33920, "loss": 0.4601, "lr": 9.930934569743354e-06, "epoch": 2.954009433962264, "percentage": 14.77, "elapsed_time": "0:09:11", "remaining_time": "0:53:03", "throughput": 5908.54, "total_tokens": 3259280} {"current_steps": 5015, "total_steps": 33920, "loss": 0.5588, "lr": 9.930507782274888e-06, "epoch": 2.9569575471698113, "percentage": 14.78, "elapsed_time": "0:09:12", "remaining_time": "0:53:03", "throughput": 5909.98, "total_tokens": 3264144} {"current_steps": 5020, "total_steps": 33920, "loss": 0.427, "lr": 9.930079689433236e-06, "epoch": 2.9599056603773586, "percentage": 14.8, "elapsed_time": "0:09:12", "remaining_time": "0:53:02", "throughput": 5910.39, "total_tokens": 3267440} {"current_steps": 5025, "total_steps": 33920, "loss": 0.5439, "lr": 9.92965029133174e-06, "epoch": 2.9628537735849054, "percentage": 14.81, "elapsed_time": "0:09:13", "remaining_time": "0:53:02", "throughput": 5911.19, "total_tokens": 3271760} {"current_steps": 5030, "total_steps": 33920, "loss": 0.4858, "lr": 9.929219588084084e-06, "epoch": 2.9658018867924527, "percentage": 14.83, "elapsed_time": "0:09:14", "remaining_time": "0:53:01", "throughput": 5911.85, "total_tokens": 3275216} {"current_steps": 5035, "total_steps": 33920, "loss": 0.4602, "lr": 9.9287875798043e-06, "epoch": 2.96875, "percentage": 14.84, "elapsed_time": "0:09:14", "remaining_time": "0:53:01", "throughput": 5912.52, "total_tokens": 3278992} {"current_steps": 5040, "total_steps": 33920, "loss": 0.5581, "lr": 9.92835426660676e-06, "epoch": 2.9716981132075473, "percentage": 14.86, "elapsed_time": "0:09:15", "remaining_time": "0:53:00", "throughput": 5912.27, "total_tokens": 3281776} {"current_steps": 5045, "total_steps": 33920, "loss": 0.4128, "lr": 9.927919648606188e-06, "epoch": 2.9746462264150946, "percentage": 14.87, "elapsed_time": "0:09:15", "remaining_time": "0:52:59", "throughput": 5911.7, "total_tokens": 3284304} {"current_steps": 5050, "total_steps": 33920, "loss": 0.3332, "lr": 9.927483725917652e-06, "epoch": 2.9775943396226414, "percentage": 14.89, "elapsed_time": "0:09:16", "remaining_time": "0:52:58", "throughput": 5910.91, "total_tokens": 3286896} {"current_steps": 5055, "total_steps": 33920, "loss": 0.5722, "lr": 9.927046498656562e-06, "epoch": 2.9805424528301887, "percentage": 14.9, "elapsed_time": "0:09:16", "remaining_time": "0:52:58", "throughput": 5911.22, "total_tokens": 3290128} {"current_steps": 5060, "total_steps": 33920, "loss": 0.597, "lr": 9.926607966938679e-06, "epoch": 2.983490566037736, "percentage": 14.92, "elapsed_time": "0:09:17", "remaining_time": "0:52:57", "throughput": 5911.49, "total_tokens": 3293520} {"current_steps": 5065, "total_steps": 33920, "loss": 0.4408, "lr": 9.926168130880103e-06, "epoch": 2.986438679245283, "percentage": 14.93, "elapsed_time": "0:09:17", "remaining_time": "0:52:56", "throughput": 5911.6, "total_tokens": 3296624} {"current_steps": 5070, "total_steps": 33920, "loss": 0.5116, "lr": 9.925726990597283e-06, "epoch": 2.98938679245283, "percentage": 14.95, "elapsed_time": "0:09:18", "remaining_time": "0:52:56", "throughput": 5912.22, "total_tokens": 3300080} {"current_steps": 5075, "total_steps": 33920, "loss": 0.5711, "lr": 9.925284546207015e-06, "epoch": 2.9923349056603774, "percentage": 14.96, "elapsed_time": "0:09:18", "remaining_time": "0:52:55", "throughput": 5912.4, "total_tokens": 3303280} {"current_steps": 5080, "total_steps": 33920, "loss": 0.524, "lr": 9.924840797826436e-06, "epoch": 2.9952830188679247, "percentage": 14.98, "elapsed_time": "0:09:19", "remaining_time": "0:52:54", "throughput": 5912.0, "total_tokens": 3306128} {"current_steps": 5085, "total_steps": 33920, "loss": 0.644, "lr": 9.924395745573029e-06, "epoch": 2.9982311320754715, "percentage": 14.99, "elapsed_time": "0:09:19", "remaining_time": "0:52:54", "throughput": 5912.17, "total_tokens": 3309264} {"current_steps": 5090, "total_steps": 33920, "loss": 0.572, "lr": 9.923949389564629e-06, "epoch": 3.001179245283019, "percentage": 15.01, "elapsed_time": "0:09:20", "remaining_time": "0:52:55", "throughput": 5908.38, "total_tokens": 3312280} {"current_steps": 5095, "total_steps": 33920, "loss": 0.5164, "lr": 9.923501729919404e-06, "epoch": 3.004127358490566, "percentage": 15.02, "elapsed_time": "0:09:21", "remaining_time": "0:52:54", "throughput": 5907.96, "total_tokens": 3314968} {"current_steps": 5100, "total_steps": 33920, "loss": 0.4092, "lr": 9.923052766755878e-06, "epoch": 3.0070754716981134, "percentage": 15.04, "elapsed_time": "0:09:21", "remaining_time": "0:52:53", "throughput": 5908.43, "total_tokens": 3318392} {"current_steps": 5105, "total_steps": 33920, "loss": 0.5324, "lr": 9.922602500192914e-06, "epoch": 3.0100235849056602, "percentage": 15.05, "elapsed_time": "0:09:22", "remaining_time": "0:52:52", "throughput": 5908.28, "total_tokens": 3321144} {"current_steps": 5110, "total_steps": 33920, "loss": 0.4799, "lr": 9.922150930349725e-06, "epoch": 3.0129716981132075, "percentage": 15.06, "elapsed_time": "0:09:22", "remaining_time": "0:52:52", "throughput": 5907.38, "total_tokens": 3323672} {"current_steps": 5115, "total_steps": 33920, "loss": 0.3751, "lr": 9.921698057345863e-06, "epoch": 3.015919811320755, "percentage": 15.08, "elapsed_time": "0:09:23", "remaining_time": "0:52:51", "throughput": 5907.41, "total_tokens": 3327064} {"current_steps": 5120, "total_steps": 33920, "loss": 0.499, "lr": 9.921243881301229e-06, "epoch": 3.018867924528302, "percentage": 15.09, "elapsed_time": "0:09:23", "remaining_time": "0:52:51", "throughput": 5908.12, "total_tokens": 3330840} {"current_steps": 5125, "total_steps": 33920, "loss": 0.3978, "lr": 9.920788402336068e-06, "epoch": 3.021816037735849, "percentage": 15.11, "elapsed_time": "0:09:24", "remaining_time": "0:52:50", "throughput": 5908.68, "total_tokens": 3334616} {"current_steps": 5130, "total_steps": 33920, "loss": 0.4086, "lr": 9.92033162057097e-06, "epoch": 3.0247641509433962, "percentage": 15.12, "elapsed_time": "0:09:24", "remaining_time": "0:52:50", "throughput": 5909.23, "total_tokens": 3337944} {"current_steps": 5135, "total_steps": 33920, "loss": 0.4396, "lr": 9.919873536126869e-06, "epoch": 3.0277122641509435, "percentage": 15.14, "elapsed_time": "0:09:25", "remaining_time": "0:52:49", "throughput": 5909.49, "total_tokens": 3341272} {"current_steps": 5140, "total_steps": 33920, "loss": 0.4916, "lr": 9.919414149125046e-06, "epoch": 3.0306603773584904, "percentage": 15.15, "elapsed_time": "0:09:25", "remaining_time": "0:52:48", "throughput": 5909.55, "total_tokens": 3344344} {"current_steps": 5145, "total_steps": 33920, "loss": 0.4229, "lr": 9.918953459687126e-06, "epoch": 3.0336084905660377, "percentage": 15.17, "elapsed_time": "0:09:26", "remaining_time": "0:52:47", "throughput": 5909.68, "total_tokens": 3347192} {"current_steps": 5150, "total_steps": 33920, "loss": 0.4529, "lr": 9.918491467935078e-06, "epoch": 3.036556603773585, "percentage": 15.18, "elapsed_time": "0:09:26", "remaining_time": "0:52:47", "throughput": 5910.66, "total_tokens": 3351224} {"current_steps": 5155, "total_steps": 33920, "loss": 0.4174, "lr": 9.918028173991218e-06, "epoch": 3.0395047169811322, "percentage": 15.2, "elapsed_time": "0:09:27", "remaining_time": "0:52:46", "throughput": 5910.22, "total_tokens": 3354072} {"current_steps": 5160, "total_steps": 33920, "loss": 0.4613, "lr": 9.917563577978202e-06, "epoch": 3.042452830188679, "percentage": 15.21, "elapsed_time": "0:09:27", "remaining_time": "0:52:45", "throughput": 5910.38, "total_tokens": 3356856} {"current_steps": 5165, "total_steps": 33920, "loss": 0.4816, "lr": 9.917097680019035e-06, "epoch": 3.0454009433962264, "percentage": 15.23, "elapsed_time": "0:09:28", "remaining_time": "0:52:45", "throughput": 5910.75, "total_tokens": 3360280} {"current_steps": 5170, "total_steps": 33920, "loss": 0.4723, "lr": 9.916630480237066e-06, "epoch": 3.0483490566037736, "percentage": 15.24, "elapsed_time": "0:09:28", "remaining_time": "0:52:44", "throughput": 5910.53, "total_tokens": 3362968} {"current_steps": 5175, "total_steps": 33920, "loss": 0.4736, "lr": 9.916161978755988e-06, "epoch": 3.051297169811321, "percentage": 15.26, "elapsed_time": "0:09:29", "remaining_time": "0:52:43", "throughput": 5911.29, "total_tokens": 3366648} {"current_steps": 5180, "total_steps": 33920, "loss": 0.4842, "lr": 9.915692175699838e-06, "epoch": 3.0542452830188678, "percentage": 15.27, "elapsed_time": "0:09:29", "remaining_time": "0:52:42", "throughput": 5911.16, "total_tokens": 3369304} {"current_steps": 5185, "total_steps": 33920, "loss": 0.5507, "lr": 9.915221071193e-06, "epoch": 3.057193396226415, "percentage": 15.29, "elapsed_time": "0:09:30", "remaining_time": "0:52:41", "throughput": 5911.51, "total_tokens": 3372504} {"current_steps": 5190, "total_steps": 33920, "loss": 0.4882, "lr": 9.914748665360199e-06, "epoch": 3.0601415094339623, "percentage": 15.3, "elapsed_time": "0:09:30", "remaining_time": "0:52:40", "throughput": 5911.44, "total_tokens": 3375096} {"current_steps": 5195, "total_steps": 33920, "loss": 0.6181, "lr": 9.914274958326507e-06, "epoch": 3.0630896226415096, "percentage": 15.32, "elapsed_time": "0:09:31", "remaining_time": "0:52:39", "throughput": 5910.95, "total_tokens": 3377592} {"current_steps": 5200, "total_steps": 33920, "loss": 0.5641, "lr": 9.913799950217341e-06, "epoch": 3.0660377358490565, "percentage": 15.33, "elapsed_time": "0:09:31", "remaining_time": "0:52:38", "throughput": 5911.3, "total_tokens": 3380728} {"current_steps": 5205, "total_steps": 33920, "loss": 0.4957, "lr": 9.91332364115846e-06, "epoch": 3.0689858490566038, "percentage": 15.34, "elapsed_time": "0:09:32", "remaining_time": "0:52:37", "throughput": 5911.19, "total_tokens": 3383416} {"current_steps": 5210, "total_steps": 33920, "loss": 0.5678, "lr": 9.912846031275972e-06, "epoch": 3.071933962264151, "percentage": 15.36, "elapsed_time": "0:09:32", "remaining_time": "0:52:37", "throughput": 5911.83, "total_tokens": 3386904} {"current_steps": 5215, "total_steps": 33920, "loss": 0.403, "lr": 9.912367120696322e-06, "epoch": 3.074882075471698, "percentage": 15.37, "elapsed_time": "0:09:33", "remaining_time": "0:52:36", "throughput": 5911.49, "total_tokens": 3389496} {"current_steps": 5220, "total_steps": 33920, "loss": 0.4631, "lr": 9.911886909546307e-06, "epoch": 3.077830188679245, "percentage": 15.39, "elapsed_time": "0:09:33", "remaining_time": "0:52:35", "throughput": 5911.82, "total_tokens": 3392856} {"current_steps": 5225, "total_steps": 33920, "loss": 0.4369, "lr": 9.911405397953063e-06, "epoch": 3.0807783018867925, "percentage": 15.4, "elapsed_time": "0:09:34", "remaining_time": "0:52:34", "throughput": 5912.07, "total_tokens": 3396280} {"current_steps": 5230, "total_steps": 33920, "loss": 0.4041, "lr": 9.910922586044073e-06, "epoch": 3.0837264150943398, "percentage": 15.42, "elapsed_time": "0:09:35", "remaining_time": "0:52:34", "throughput": 5912.52, "total_tokens": 3400216} {"current_steps": 5235, "total_steps": 33920, "loss": 0.4477, "lr": 9.910438473947163e-06, "epoch": 3.0866745283018866, "percentage": 15.43, "elapsed_time": "0:09:35", "remaining_time": "0:52:33", "throughput": 5912.06, "total_tokens": 3402744} {"current_steps": 5240, "total_steps": 33920, "loss": 0.6051, "lr": 9.909953061790506e-06, "epoch": 3.089622641509434, "percentage": 15.45, "elapsed_time": "0:09:36", "remaining_time": "0:52:33", "throughput": 5912.14, "total_tokens": 3405816} {"current_steps": 5245, "total_steps": 33920, "loss": 0.5483, "lr": 9.909466349702613e-06, "epoch": 3.092570754716981, "percentage": 15.46, "elapsed_time": "0:09:36", "remaining_time": "0:52:32", "throughput": 5912.1, "total_tokens": 3408824} {"current_steps": 5250, "total_steps": 33920, "loss": 0.4303, "lr": 9.908978337812348e-06, "epoch": 3.0955188679245285, "percentage": 15.48, "elapsed_time": "0:09:37", "remaining_time": "0:52:31", "throughput": 5912.46, "total_tokens": 3412504} {"current_steps": 5255, "total_steps": 33920, "loss": 0.6035, "lr": 9.908489026248909e-06, "epoch": 3.0984669811320753, "percentage": 15.49, "elapsed_time": "0:09:37", "remaining_time": "0:52:30", "throughput": 5912.43, "total_tokens": 3415192} {"current_steps": 5260, "total_steps": 33920, "loss": 0.4859, "lr": 9.907998415141846e-06, "epoch": 3.1014150943396226, "percentage": 15.51, "elapsed_time": "0:09:38", "remaining_time": "0:52:30", "throughput": 5912.38, "total_tokens": 3418456} {"current_steps": 5265, "total_steps": 33920, "loss": 0.4454, "lr": 9.907506504621052e-06, "epoch": 3.10436320754717, "percentage": 15.52, "elapsed_time": "0:09:38", "remaining_time": "0:52:29", "throughput": 5912.7, "total_tokens": 3421560} {"current_steps": 5270, "total_steps": 33920, "loss": 0.5021, "lr": 9.907013294816759e-06, "epoch": 3.107311320754717, "percentage": 15.54, "elapsed_time": "0:09:39", "remaining_time": "0:52:29", "throughput": 5913.28, "total_tokens": 3425272} {"current_steps": 5275, "total_steps": 33920, "loss": 0.4863, "lr": 9.906518785859548e-06, "epoch": 3.110259433962264, "percentage": 15.55, "elapsed_time": "0:09:39", "remaining_time": "0:52:28", "throughput": 5913.4, "total_tokens": 3428216} {"current_steps": 5280, "total_steps": 33920, "loss": 0.3763, "lr": 9.906022977880344e-06, "epoch": 3.1132075471698113, "percentage": 15.57, "elapsed_time": "0:09:40", "remaining_time": "0:52:27", "throughput": 5913.44, "total_tokens": 3431032} {"current_steps": 5285, "total_steps": 33920, "loss": 0.3967, "lr": 9.905525871010412e-06, "epoch": 3.1161556603773586, "percentage": 15.58, "elapsed_time": "0:09:40", "remaining_time": "0:52:26", "throughput": 5913.28, "total_tokens": 3434104} {"current_steps": 5290, "total_steps": 33920, "loss": 0.4336, "lr": 9.905027465381363e-06, "epoch": 3.119103773584906, "percentage": 15.6, "elapsed_time": "0:09:41", "remaining_time": "0:52:25", "throughput": 5913.08, "total_tokens": 3436824} {"current_steps": 5295, "total_steps": 33920, "loss": 0.6082, "lr": 9.904527761125155e-06, "epoch": 3.1220518867924527, "percentage": 15.61, "elapsed_time": "0:09:41", "remaining_time": "0:52:24", "throughput": 5912.71, "total_tokens": 3439352} {"current_steps": 5300, "total_steps": 33920, "loss": 0.381, "lr": 9.904026758374083e-06, "epoch": 3.125, "percentage": 15.62, "elapsed_time": "0:09:42", "remaining_time": "0:52:24", "throughput": 5912.46, "total_tokens": 3442680} {"current_steps": 5305, "total_steps": 33920, "loss": 0.4136, "lr": 9.903524457260794e-06, "epoch": 3.1279481132075473, "percentage": 15.64, "elapsed_time": "0:09:42", "remaining_time": "0:52:23", "throughput": 5912.72, "total_tokens": 3445944} {"current_steps": 5310, "total_steps": 33920, "loss": 0.4896, "lr": 9.90302085791827e-06, "epoch": 3.1308962264150946, "percentage": 15.65, "elapsed_time": "0:09:43", "remaining_time": "0:52:22", "throughput": 5913.02, "total_tokens": 3449080} {"current_steps": 5315, "total_steps": 33920, "loss": 0.5089, "lr": 9.902515960479844e-06, "epoch": 3.1338443396226414, "percentage": 15.67, "elapsed_time": "0:09:43", "remaining_time": "0:52:22", "throughput": 5914.04, "total_tokens": 3453208} {"current_steps": 5320, "total_steps": 33920, "loss": 0.5379, "lr": 9.902009765079188e-06, "epoch": 3.1367924528301887, "percentage": 15.68, "elapsed_time": "0:09:44", "remaining_time": "0:52:21", "throughput": 5914.82, "total_tokens": 3456856} {"current_steps": 5325, "total_steps": 33920, "loss": 0.462, "lr": 9.90150227185032e-06, "epoch": 3.139740566037736, "percentage": 15.7, "elapsed_time": "0:09:44", "remaining_time": "0:52:20", "throughput": 5914.77, "total_tokens": 3459672} {"current_steps": 5330, "total_steps": 33920, "loss": 0.5942, "lr": 9.900993480927603e-06, "epoch": 3.142688679245283, "percentage": 15.71, "elapsed_time": "0:09:45", "remaining_time": "0:52:20", "throughput": 5913.81, "total_tokens": 3462040} {"current_steps": 5335, "total_steps": 33920, "loss": 0.5012, "lr": 9.90048339244574e-06, "epoch": 3.14563679245283, "percentage": 15.73, "elapsed_time": "0:09:45", "remaining_time": "0:52:19", "throughput": 5913.68, "total_tokens": 3464856} {"current_steps": 5340, "total_steps": 33920, "loss": 0.4121, "lr": 9.899972006539776e-06, "epoch": 3.1485849056603774, "percentage": 15.74, "elapsed_time": "0:09:46", "remaining_time": "0:52:18", "throughput": 5914.01, "total_tokens": 3467928} {"current_steps": 5345, "total_steps": 33920, "loss": 0.5219, "lr": 9.899459323345106e-06, "epoch": 3.1515330188679247, "percentage": 15.76, "elapsed_time": "0:09:46", "remaining_time": "0:52:17", "throughput": 5914.23, "total_tokens": 3471096} {"current_steps": 5350, "total_steps": 33920, "loss": 0.4654, "lr": 9.898945342997467e-06, "epoch": 3.1544811320754715, "percentage": 15.77, "elapsed_time": "0:09:47", "remaining_time": "0:52:17", "throughput": 5913.87, "total_tokens": 3474808} {"current_steps": 5355, "total_steps": 33920, "loss": 0.3936, "lr": 9.898430065632933e-06, "epoch": 3.157429245283019, "percentage": 15.79, "elapsed_time": "0:09:48", "remaining_time": "0:52:17", "throughput": 5914.21, "total_tokens": 3478296} {"current_steps": 5360, "total_steps": 33920, "loss": 0.4716, "lr": 9.897913491387929e-06, "epoch": 3.160377358490566, "percentage": 15.8, "elapsed_time": "0:09:48", "remaining_time": "0:52:16", "throughput": 5914.23, "total_tokens": 3481304} {"current_steps": 5365, "total_steps": 33920, "loss": 0.5651, "lr": 9.897395620399219e-06, "epoch": 3.1633254716981134, "percentage": 15.82, "elapsed_time": "0:09:49", "remaining_time": "0:52:16", "throughput": 5915.45, "total_tokens": 3486200} {"current_steps": 5370, "total_steps": 33920, "loss": 0.5685, "lr": 9.896876452803913e-06, "epoch": 3.1662735849056602, "percentage": 15.83, "elapsed_time": "0:09:49", "remaining_time": "0:52:16", "throughput": 5916.1, "total_tokens": 3489784} {"current_steps": 5375, "total_steps": 33920, "loss": 0.4432, "lr": 9.896355988739461e-06, "epoch": 3.1692216981132075, "percentage": 15.85, "elapsed_time": "0:09:50", "remaining_time": "0:52:15", "throughput": 5916.04, "total_tokens": 3492824} {"current_steps": 5380, "total_steps": 33920, "loss": 0.5175, "lr": 9.895834228343658e-06, "epoch": 3.172169811320755, "percentage": 15.86, "elapsed_time": "0:09:50", "remaining_time": "0:52:14", "throughput": 5916.14, "total_tokens": 3495736} {"current_steps": 5385, "total_steps": 33920, "loss": 0.5193, "lr": 9.895311171754644e-06, "epoch": 3.175117924528302, "percentage": 15.88, "elapsed_time": "0:09:51", "remaining_time": "0:52:13", "throughput": 5916.18, "total_tokens": 3498616} {"current_steps": 5390, "total_steps": 33920, "loss": 0.5631, "lr": 9.8947868191109e-06, "epoch": 3.178066037735849, "percentage": 15.89, "elapsed_time": "0:09:51", "remaining_time": "0:52:12", "throughput": 5916.76, "total_tokens": 3501976} {"current_steps": 5395, "total_steps": 33920, "loss": 0.4348, "lr": 9.894261170551249e-06, "epoch": 3.1810141509433962, "percentage": 15.91, "elapsed_time": "0:09:52", "remaining_time": "0:52:13", "throughput": 5918.06, "total_tokens": 3507096} {"current_steps": 5400, "total_steps": 33920, "loss": 0.4042, "lr": 9.893734226214861e-06, "epoch": 3.1839622641509435, "percentage": 15.92, "elapsed_time": "0:09:53", "remaining_time": "0:52:12", "throughput": 5918.44, "total_tokens": 3510776} {"current_steps": 5405, "total_steps": 33920, "loss": 0.4858, "lr": 9.893205986241246e-06, "epoch": 3.1869103773584904, "percentage": 15.93, "elapsed_time": "0:09:53", "remaining_time": "0:52:12", "throughput": 5918.78, "total_tokens": 3514712} {"current_steps": 5410, "total_steps": 33920, "loss": 0.3711, "lr": 9.892676450770257e-06, "epoch": 3.1898584905660377, "percentage": 15.95, "elapsed_time": "0:09:54", "remaining_time": "0:52:12", "throughput": 5918.55, "total_tokens": 3517688} {"current_steps": 5415, "total_steps": 33920, "loss": 0.3671, "lr": 9.892145619942092e-06, "epoch": 3.192806603773585, "percentage": 15.96, "elapsed_time": "0:09:54", "remaining_time": "0:52:11", "throughput": 5918.72, "total_tokens": 3520760} {"current_steps": 5420, "total_steps": 33920, "loss": 0.4361, "lr": 9.891613493897289e-06, "epoch": 3.1957547169811322, "percentage": 15.98, "elapsed_time": "0:09:55", "remaining_time": "0:52:10", "throughput": 5918.54, "total_tokens": 3523672} {"current_steps": 5425, "total_steps": 33920, "loss": 0.6848, "lr": 9.891080072776733e-06, "epoch": 3.198702830188679, "percentage": 15.99, "elapsed_time": "0:09:55", "remaining_time": "0:52:09", "throughput": 5918.49, "total_tokens": 3526552} {"current_steps": 5430, "total_steps": 33920, "loss": 0.5061, "lr": 9.890545356721649e-06, "epoch": 3.2016509433962264, "percentage": 16.01, "elapsed_time": "0:09:56", "remaining_time": "0:52:09", "throughput": 5919.04, "total_tokens": 3530552} {"current_steps": 5435, "total_steps": 33920, "loss": 0.4507, "lr": 9.890009345873603e-06, "epoch": 3.2045990566037736, "percentage": 16.02, "elapsed_time": "0:09:56", "remaining_time": "0:52:08", "throughput": 5919.33, "total_tokens": 3533656} {"current_steps": 5440, "total_steps": 33920, "loss": 0.3722, "lr": 9.889472040374509e-06, "epoch": 3.207547169811321, "percentage": 16.04, "elapsed_time": "0:09:57", "remaining_time": "0:52:07", "throughput": 5919.36, "total_tokens": 3536632} {"current_steps": 5445, "total_steps": 33920, "loss": 0.4766, "lr": 9.88893344036662e-06, "epoch": 3.2104952830188678, "percentage": 16.05, "elapsed_time": "0:09:57", "remaining_time": "0:52:07", "throughput": 5918.81, "total_tokens": 3539256} {"current_steps": 5450, "total_steps": 33920, "loss": 0.5999, "lr": 9.888393545992531e-06, "epoch": 3.213443396226415, "percentage": 16.07, "elapsed_time": "0:09:58", "remaining_time": "0:52:06", "throughput": 5917.83, "total_tokens": 3541624} {"current_steps": 5455, "total_steps": 33920, "loss": 0.3474, "lr": 9.887852357395184e-06, "epoch": 3.2163915094339623, "percentage": 16.08, "elapsed_time": "0:09:59", "remaining_time": "0:52:05", "throughput": 5918.25, "total_tokens": 3545272} {"current_steps": 5460, "total_steps": 33920, "loss": 0.4934, "lr": 9.88730987471786e-06, "epoch": 3.2193396226415096, "percentage": 16.1, "elapsed_time": "0:09:59", "remaining_time": "0:52:05", "throughput": 5918.65, "total_tokens": 3548760} {"current_steps": 5465, "total_steps": 33920, "loss": 0.5045, "lr": 9.886766098104183e-06, "epoch": 3.2222877358490565, "percentage": 16.11, "elapsed_time": "0:10:00", "remaining_time": "0:52:05", "throughput": 5919.79, "total_tokens": 3553208} {"current_steps": 5470, "total_steps": 33920, "loss": 0.4052, "lr": 9.886221027698122e-06, "epoch": 3.2252358490566038, "percentage": 16.13, "elapsed_time": "0:10:00", "remaining_time": "0:52:04", "throughput": 5919.61, "total_tokens": 3555800} {"current_steps": 5475, "total_steps": 33920, "loss": 0.6302, "lr": 9.885674663643983e-06, "epoch": 3.228183962264151, "percentage": 16.14, "elapsed_time": "0:10:01", "remaining_time": "0:52:03", "throughput": 5919.78, "total_tokens": 3558616} {"current_steps": 5480, "total_steps": 33920, "loss": 0.734, "lr": 9.885127006086423e-06, "epoch": 3.231132075471698, "percentage": 16.16, "elapsed_time": "0:10:01", "remaining_time": "0:52:02", "throughput": 5920.44, "total_tokens": 3562264} {"current_steps": 5485, "total_steps": 33920, "loss": 0.5638, "lr": 9.884578055170434e-06, "epoch": 3.234080188679245, "percentage": 16.17, "elapsed_time": "0:10:02", "remaining_time": "0:52:02", "throughput": 5920.93, "total_tokens": 3565912} {"current_steps": 5490, "total_steps": 33920, "loss": 0.4199, "lr": 9.884027811041353e-06, "epoch": 3.2370283018867925, "percentage": 16.19, "elapsed_time": "0:10:02", "remaining_time": "0:52:02", "throughput": 5921.92, "total_tokens": 3570200} {"current_steps": 5495, "total_steps": 33920, "loss": 0.5261, "lr": 9.883476273844861e-06, "epoch": 3.2399764150943398, "percentage": 16.2, "elapsed_time": "0:10:03", "remaining_time": "0:52:00", "throughput": 5922.06, "total_tokens": 3572952} {"current_steps": 5500, "total_steps": 33920, "loss": 0.3781, "lr": 9.882923443726977e-06, "epoch": 3.2429245283018866, "percentage": 16.21, "elapsed_time": "0:10:03", "remaining_time": "0:52:00", "throughput": 5922.13, "total_tokens": 3575800} {"current_steps": 5505, "total_steps": 33920, "loss": 0.4212, "lr": 9.882369320834068e-06, "epoch": 3.245872641509434, "percentage": 16.23, "elapsed_time": "0:10:04", "remaining_time": "0:51:59", "throughput": 5922.54, "total_tokens": 3579256} {"current_steps": 5510, "total_steps": 33920, "loss": 0.4401, "lr": 9.88181390531284e-06, "epoch": 3.248820754716981, "percentage": 16.24, "elapsed_time": "0:10:04", "remaining_time": "0:51:59", "throughput": 5923.15, "total_tokens": 3583160} {"current_steps": 5515, "total_steps": 33920, "loss": 0.4397, "lr": 9.88125719731034e-06, "epoch": 3.2517688679245285, "percentage": 16.26, "elapsed_time": "0:10:05", "remaining_time": "0:51:58", "throughput": 5924.07, "total_tokens": 3587448} {"current_steps": 5520, "total_steps": 33920, "loss": 0.4377, "lr": 9.880699196973962e-06, "epoch": 3.2547169811320753, "percentage": 16.27, "elapsed_time": "0:10:06", "remaining_time": "0:51:58", "throughput": 5924.85, "total_tokens": 3591160} {"current_steps": 5525, "total_steps": 33920, "loss": 0.4794, "lr": 9.880139904451436e-06, "epoch": 3.2576650943396226, "percentage": 16.29, "elapsed_time": "0:10:06", "remaining_time": "0:51:57", "throughput": 5924.78, "total_tokens": 3593880} {"current_steps": 5530, "total_steps": 33920, "loss": 0.4034, "lr": 9.879579319890838e-06, "epoch": 3.26061320754717, "percentage": 16.3, "elapsed_time": "0:10:07", "remaining_time": "0:51:56", "throughput": 5924.92, "total_tokens": 3596792} {"current_steps": 5535, "total_steps": 33920, "loss": 0.4078, "lr": 9.879017443440584e-06, "epoch": 3.263561320754717, "percentage": 16.32, "elapsed_time": "0:10:07", "remaining_time": "0:51:55", "throughput": 5925.23, "total_tokens": 3599928} {"current_steps": 5540, "total_steps": 33920, "loss": 0.4507, "lr": 9.878454275249436e-06, "epoch": 3.266509433962264, "percentage": 16.33, "elapsed_time": "0:10:08", "remaining_time": "0:51:54", "throughput": 5925.22, "total_tokens": 3602872} {"current_steps": 5545, "total_steps": 33920, "loss": 0.4563, "lr": 9.877889815466493e-06, "epoch": 3.2694575471698113, "percentage": 16.35, "elapsed_time": "0:10:08", "remaining_time": "0:51:54", "throughput": 5925.74, "total_tokens": 3606328} {"current_steps": 5550, "total_steps": 33920, "loss": 0.4057, "lr": 9.877324064241198e-06, "epoch": 3.2724056603773586, "percentage": 16.36, "elapsed_time": "0:10:09", "remaining_time": "0:51:53", "throughput": 5925.77, "total_tokens": 3609400} {"current_steps": 5555, "total_steps": 33920, "loss": 0.5476, "lr": 9.876757021723338e-06, "epoch": 3.2753537735849054, "percentage": 16.38, "elapsed_time": "0:10:09", "remaining_time": "0:51:52", "throughput": 5925.72, "total_tokens": 3612216} {"current_steps": 5560, "total_steps": 33920, "loss": 0.3909, "lr": 9.876188688063038e-06, "epoch": 3.2783018867924527, "percentage": 16.39, "elapsed_time": "0:10:10", "remaining_time": "0:51:52", "throughput": 5926.29, "total_tokens": 3616408} {"current_steps": 5565, "total_steps": 33920, "loss": 0.4765, "lr": 9.875619063410768e-06, "epoch": 3.28125, "percentage": 16.41, "elapsed_time": "0:10:10", "remaining_time": "0:51:52", "throughput": 5926.93, "total_tokens": 3620216} {"current_steps": 5570, "total_steps": 33920, "loss": 0.6603, "lr": 9.875048147917339e-06, "epoch": 3.2841981132075473, "percentage": 16.42, "elapsed_time": "0:10:11", "remaining_time": "0:51:51", "throughput": 5927.22, "total_tokens": 3623384} {"current_steps": 5575, "total_steps": 33920, "loss": 0.3378, "lr": 9.874475941733902e-06, "epoch": 3.2871462264150946, "percentage": 16.44, "elapsed_time": "0:10:11", "remaining_time": "0:51:50", "throughput": 5927.66, "total_tokens": 3626712} {"current_steps": 5580, "total_steps": 33920, "loss": 0.4546, "lr": 9.873902445011952e-06, "epoch": 3.2900943396226414, "percentage": 16.45, "elapsed_time": "0:10:12", "remaining_time": "0:51:50", "throughput": 5927.52, "total_tokens": 3629752} {"current_steps": 5585, "total_steps": 33920, "loss": 0.5013, "lr": 9.873327657903324e-06, "epoch": 3.2930424528301887, "percentage": 16.47, "elapsed_time": "0:10:12", "remaining_time": "0:51:49", "throughput": 5927.53, "total_tokens": 3632536} {"current_steps": 5590, "total_steps": 33920, "loss": 0.3636, "lr": 9.872751580560194e-06, "epoch": 3.295990566037736, "percentage": 16.48, "elapsed_time": "0:10:13", "remaining_time": "0:51:48", "throughput": 5927.75, "total_tokens": 3635768} {"current_steps": 5595, "total_steps": 33920, "loss": 0.3771, "lr": 9.872174213135084e-06, "epoch": 3.298938679245283, "percentage": 16.49, "elapsed_time": "0:10:13", "remaining_time": "0:51:47", "throughput": 5927.55, "total_tokens": 3638424} {"current_steps": 5600, "total_steps": 33920, "loss": 0.4962, "lr": 9.871595555780855e-06, "epoch": 3.30188679245283, "percentage": 16.51, "elapsed_time": "0:10:14", "remaining_time": "0:51:46", "throughput": 5927.93, "total_tokens": 3641912} {"current_steps": 5605, "total_steps": 33920, "loss": 0.4433, "lr": 9.871015608650705e-06, "epoch": 3.3048349056603774, "percentage": 16.52, "elapsed_time": "0:10:14", "remaining_time": "0:51:46", "throughput": 5927.94, "total_tokens": 3644856} {"current_steps": 5610, "total_steps": 33920, "loss": 0.5282, "lr": 9.870434371898182e-06, "epoch": 3.3077830188679247, "percentage": 16.54, "elapsed_time": "0:10:15", "remaining_time": "0:51:45", "throughput": 5928.23, "total_tokens": 3647960} {"current_steps": 5615, "total_steps": 33920, "loss": 0.4544, "lr": 9.869851845677165e-06, "epoch": 3.3107311320754715, "percentage": 16.55, "elapsed_time": "0:10:15", "remaining_time": "0:51:44", "throughput": 5928.82, "total_tokens": 3651416} {"current_steps": 5620, "total_steps": 33920, "loss": 0.4013, "lr": 9.869268030141886e-06, "epoch": 3.313679245283019, "percentage": 16.57, "elapsed_time": "0:10:16", "remaining_time": "0:51:44", "throughput": 5929.63, "total_tokens": 3655192} {"current_steps": 5625, "total_steps": 33920, "loss": 0.4207, "lr": 9.86868292544691e-06, "epoch": 3.316627358490566, "percentage": 16.58, "elapsed_time": "0:10:16", "remaining_time": "0:51:43", "throughput": 5929.62, "total_tokens": 3658200} {"current_steps": 5630, "total_steps": 33920, "loss": 0.5041, "lr": 9.868096531747149e-06, "epoch": 3.3195754716981134, "percentage": 16.6, "elapsed_time": "0:10:17", "remaining_time": "0:51:42", "throughput": 5930.11, "total_tokens": 3661720} {"current_steps": 5635, "total_steps": 33920, "loss": 0.4718, "lr": 9.867508849197848e-06, "epoch": 3.3225235849056602, "percentage": 16.61, "elapsed_time": "0:10:17", "remaining_time": "0:51:41", "throughput": 5929.79, "total_tokens": 3664216} {"current_steps": 5640, "total_steps": 33920, "loss": 0.5067, "lr": 9.866919877954602e-06, "epoch": 3.3254716981132075, "percentage": 16.63, "elapsed_time": "0:10:18", "remaining_time": "0:51:41", "throughput": 5930.03, "total_tokens": 3667800} {"current_steps": 5645, "total_steps": 33920, "loss": 0.485, "lr": 9.866329618173344e-06, "epoch": 3.328419811320755, "percentage": 16.64, "elapsed_time": "0:10:19", "remaining_time": "0:51:41", "throughput": 5930.65, "total_tokens": 3671800} {"current_steps": 5650, "total_steps": 33920, "loss": 0.4444, "lr": 9.865738070010346e-06, "epoch": 3.331367924528302, "percentage": 16.66, "elapsed_time": "0:10:19", "remaining_time": "0:51:40", "throughput": 5930.4, "total_tokens": 3674424} {"current_steps": 5655, "total_steps": 33920, "loss": 0.5183, "lr": 9.865145233622223e-06, "epoch": 3.334316037735849, "percentage": 16.67, "elapsed_time": "0:10:20", "remaining_time": "0:51:39", "throughput": 5930.46, "total_tokens": 3677144} {"current_steps": 5660, "total_steps": 33920, "loss": 0.6434, "lr": 9.864551109165935e-06, "epoch": 3.3372641509433962, "percentage": 16.69, "elapsed_time": "0:10:20", "remaining_time": "0:51:38", "throughput": 5930.11, "total_tokens": 3679768} {"current_steps": 5665, "total_steps": 33920, "loss": 0.4124, "lr": 9.863955696798773e-06, "epoch": 3.3402122641509435, "percentage": 16.7, "elapsed_time": "0:10:21", "remaining_time": "0:51:40", "throughput": 5931.54, "total_tokens": 3687576} {"current_steps": 5670, "total_steps": 33920, "loss": 0.4306, "lr": 9.863358996678378e-06, "epoch": 3.3431603773584904, "percentage": 16.72, "elapsed_time": "0:10:22", "remaining_time": "0:51:40", "throughput": 5931.53, "total_tokens": 3690936} {"current_steps": 5675, "total_steps": 33920, "loss": 0.3543, "lr": 9.86276100896273e-06, "epoch": 3.3461084905660377, "percentage": 16.73, "elapsed_time": "0:10:22", "remaining_time": "0:51:39", "throughput": 5932.09, "total_tokens": 3694616} {"current_steps": 5680, "total_steps": 33920, "loss": 0.5386, "lr": 9.862161733810147e-06, "epoch": 3.349056603773585, "percentage": 16.75, "elapsed_time": "0:10:23", "remaining_time": "0:51:39", "throughput": 5932.04, "total_tokens": 3697720} {"current_steps": 5685, "total_steps": 33920, "loss": 0.4007, "lr": 9.86156117137929e-06, "epoch": 3.3520047169811322, "percentage": 16.76, "elapsed_time": "0:10:23", "remaining_time": "0:51:38", "throughput": 5931.32, "total_tokens": 3700120} {"current_steps": 5690, "total_steps": 33920, "loss": 0.4636, "lr": 9.860959321829159e-06, "epoch": 3.354952830188679, "percentage": 16.77, "elapsed_time": "0:10:24", "remaining_time": "0:51:37", "throughput": 5931.74, "total_tokens": 3703768} {"current_steps": 5695, "total_steps": 33920, "loss": 0.514, "lr": 9.860356185319102e-06, "epoch": 3.3579009433962264, "percentage": 16.79, "elapsed_time": "0:10:24", "remaining_time": "0:51:37", "throughput": 5932.25, "total_tokens": 3707448} {"current_steps": 5700, "total_steps": 33920, "loss": 0.4787, "lr": 9.859751762008796e-06, "epoch": 3.3608490566037736, "percentage": 16.8, "elapsed_time": "0:10:25", "remaining_time": "0:51:36", "throughput": 5931.9, "total_tokens": 3709976} {"current_steps": 5705, "total_steps": 33920, "loss": 0.6716, "lr": 9.859146052058266e-06, "epoch": 3.363797169811321, "percentage": 16.82, "elapsed_time": "0:10:25", "remaining_time": "0:51:35", "throughput": 5931.77, "total_tokens": 3713208} {"current_steps": 5710, "total_steps": 33920, "loss": 0.3992, "lr": 9.858539055627876e-06, "epoch": 3.3667452830188678, "percentage": 16.83, "elapsed_time": "0:10:26", "remaining_time": "0:51:35", "throughput": 5932.02, "total_tokens": 3716504} {"current_steps": 5715, "total_steps": 33920, "loss": 0.6256, "lr": 9.857930772878333e-06, "epoch": 3.369693396226415, "percentage": 16.85, "elapsed_time": "0:10:27", "remaining_time": "0:51:34", "throughput": 5931.01, "total_tokens": 3718744} {"current_steps": 5720, "total_steps": 33920, "loss": 0.4481, "lr": 9.857321203970682e-06, "epoch": 3.3726415094339623, "percentage": 16.86, "elapsed_time": "0:10:27", "remaining_time": "0:51:33", "throughput": 5930.21, "total_tokens": 3721112} {"current_steps": 5725, "total_steps": 33920, "loss": 0.5411, "lr": 9.856710349066307e-06, "epoch": 3.3755896226415096, "percentage": 16.88, "elapsed_time": "0:10:28", "remaining_time": "0:51:33", "throughput": 5930.55, "total_tokens": 3725048} {"current_steps": 5730, "total_steps": 33920, "loss": 0.4255, "lr": 9.856098208326937e-06, "epoch": 3.3785377358490565, "percentage": 16.89, "elapsed_time": "0:10:28", "remaining_time": "0:51:32", "throughput": 5930.63, "total_tokens": 3728504} {"current_steps": 5735, "total_steps": 33920, "loss": 0.5363, "lr": 9.855484781914639e-06, "epoch": 3.3814858490566038, "percentage": 16.91, "elapsed_time": "0:10:29", "remaining_time": "0:51:32", "throughput": 5930.7, "total_tokens": 3731448} {"current_steps": 5740, "total_steps": 33920, "loss": 0.5811, "lr": 9.854870069991817e-06, "epoch": 3.384433962264151, "percentage": 16.92, "elapsed_time": "0:10:29", "remaining_time": "0:51:31", "throughput": 5931.19, "total_tokens": 3734808} {"current_steps": 5745, "total_steps": 33920, "loss": 0.5007, "lr": 9.854254072721222e-06, "epoch": 3.387382075471698, "percentage": 16.94, "elapsed_time": "0:10:30", "remaining_time": "0:51:30", "throughput": 5931.32, "total_tokens": 3737688} {"current_steps": 5750, "total_steps": 33920, "loss": 0.4135, "lr": 9.853636790265938e-06, "epoch": 3.390330188679245, "percentage": 16.95, "elapsed_time": "0:10:30", "remaining_time": "0:51:29", "throughput": 5931.63, "total_tokens": 3740888} {"current_steps": 5755, "total_steps": 33920, "loss": 0.3697, "lr": 9.853018222789397e-06, "epoch": 3.3932783018867925, "percentage": 16.97, "elapsed_time": "0:10:31", "remaining_time": "0:51:29", "throughput": 5931.61, "total_tokens": 3744184} {"current_steps": 5760, "total_steps": 33920, "loss": 0.4767, "lr": 9.852398370455367e-06, "epoch": 3.3962264150943398, "percentage": 16.98, "elapsed_time": "0:10:31", "remaining_time": "0:51:28", "throughput": 5931.67, "total_tokens": 3747384} {"current_steps": 5765, "total_steps": 33920, "loss": 0.5057, "lr": 9.851777233427955e-06, "epoch": 3.3991745283018866, "percentage": 17.0, "elapsed_time": "0:10:32", "remaining_time": "0:51:28", "throughput": 5931.19, "total_tokens": 3750296} {"current_steps": 5770, "total_steps": 33920, "loss": 0.3903, "lr": 9.85115481187161e-06, "epoch": 3.402122641509434, "percentage": 17.01, "elapsed_time": "0:10:32", "remaining_time": "0:51:27", "throughput": 5931.44, "total_tokens": 3753624} {"current_steps": 5775, "total_steps": 33920, "loss": 0.502, "lr": 9.850531105951123e-06, "epoch": 3.405070754716981, "percentage": 17.03, "elapsed_time": "0:10:33", "remaining_time": "0:51:26", "throughput": 5932.04, "total_tokens": 3757400} {"current_steps": 5780, "total_steps": 33920, "loss": 0.4246, "lr": 9.84990611583162e-06, "epoch": 3.4080188679245285, "percentage": 17.04, "elapsed_time": "0:10:33", "remaining_time": "0:51:26", "throughput": 5931.95, "total_tokens": 3760344} {"current_steps": 5785, "total_steps": 33920, "loss": 0.4753, "lr": 9.849279841678572e-06, "epoch": 3.4109669811320753, "percentage": 17.05, "elapsed_time": "0:10:34", "remaining_time": "0:51:25", "throughput": 5932.34, "total_tokens": 3763512} {"current_steps": 5790, "total_steps": 33920, "loss": 0.4299, "lr": 9.848652283657785e-06, "epoch": 3.4139150943396226, "percentage": 17.07, "elapsed_time": "0:10:34", "remaining_time": "0:51:24", "throughput": 5932.11, "total_tokens": 3766232} {"current_steps": 5795, "total_steps": 33920, "loss": 0.3983, "lr": 9.848023441935411e-06, "epoch": 3.41686320754717, "percentage": 17.08, "elapsed_time": "0:10:35", "remaining_time": "0:51:24", "throughput": 5932.97, "total_tokens": 3770616} {"current_steps": 5800, "total_steps": 33920, "loss": 0.3599, "lr": 9.847393316677935e-06, "epoch": 3.419811320754717, "percentage": 17.1, "elapsed_time": "0:10:36", "remaining_time": "0:51:23", "throughput": 5933.02, "total_tokens": 3773464} {"current_steps": 5805, "total_steps": 33920, "loss": 0.4248, "lr": 9.846761908052188e-06, "epoch": 3.422759433962264, "percentage": 17.11, "elapsed_time": "0:10:36", "remaining_time": "0:51:22", "throughput": 5932.97, "total_tokens": 3776472} {"current_steps": 5810, "total_steps": 33920, "loss": 0.4617, "lr": 9.846129216225338e-06, "epoch": 3.4257075471698113, "percentage": 17.13, "elapsed_time": "0:10:37", "remaining_time": "0:51:22", "throughput": 5933.41, "total_tokens": 3780056} {"current_steps": 5815, "total_steps": 33920, "loss": 0.4772, "lr": 9.845495241364892e-06, "epoch": 3.4286556603773586, "percentage": 17.14, "elapsed_time": "0:10:37", "remaining_time": "0:51:21", "throughput": 5933.93, "total_tokens": 3783800} {"current_steps": 5820, "total_steps": 33920, "loss": 0.4921, "lr": 9.844859983638696e-06, "epoch": 3.4316037735849054, "percentage": 17.16, "elapsed_time": "0:10:38", "remaining_time": "0:51:21", "throughput": 5934.04, "total_tokens": 3786744} {"current_steps": 5825, "total_steps": 33920, "loss": 0.5713, "lr": 9.844223443214942e-06, "epoch": 3.4345518867924527, "percentage": 17.17, "elapsed_time": "0:10:38", "remaining_time": "0:51:20", "throughput": 5934.16, "total_tokens": 3789624} {"current_steps": 5830, "total_steps": 33920, "loss": 0.4781, "lr": 9.843585620262153e-06, "epoch": 3.4375, "percentage": 17.19, "elapsed_time": "0:10:39", "remaining_time": "0:51:19", "throughput": 5934.92, "total_tokens": 3793816} {"current_steps": 5835, "total_steps": 33920, "loss": 0.5455, "lr": 9.842946514949197e-06, "epoch": 3.4404481132075473, "percentage": 17.2, "elapsed_time": "0:10:39", "remaining_time": "0:51:19", "throughput": 5934.21, "total_tokens": 3796248} {"current_steps": 5840, "total_steps": 33920, "loss": 0.5237, "lr": 9.842306127445279e-06, "epoch": 3.4433962264150946, "percentage": 17.22, "elapsed_time": "0:10:40", "remaining_time": "0:51:18", "throughput": 5934.12, "total_tokens": 3799000} {"current_steps": 5845, "total_steps": 33920, "loss": 0.4977, "lr": 9.841664457919944e-06, "epoch": 3.4463443396226414, "percentage": 17.23, "elapsed_time": "0:10:40", "remaining_time": "0:51:17", "throughput": 5934.19, "total_tokens": 3801976} {"current_steps": 5850, "total_steps": 33920, "loss": 0.544, "lr": 9.841021506543079e-06, "epoch": 3.4492924528301887, "percentage": 17.25, "elapsed_time": "0:10:41", "remaining_time": "0:51:16", "throughput": 5934.64, "total_tokens": 3805432} {"current_steps": 5855, "total_steps": 33920, "loss": 0.4171, "lr": 9.840377273484904e-06, "epoch": 3.452240566037736, "percentage": 17.26, "elapsed_time": "0:10:41", "remaining_time": "0:51:16", "throughput": 5935.07, "total_tokens": 3809144} {"current_steps": 5860, "total_steps": 33920, "loss": 0.5361, "lr": 9.839731758915986e-06, "epoch": 3.455188679245283, "percentage": 17.28, "elapsed_time": "0:10:42", "remaining_time": "0:51:15", "throughput": 5935.29, "total_tokens": 3812472} {"current_steps": 5865, "total_steps": 33920, "loss": 0.4048, "lr": 9.839084963007226e-06, "epoch": 3.45813679245283, "percentage": 17.29, "elapsed_time": "0:10:42", "remaining_time": "0:51:15", "throughput": 5935.16, "total_tokens": 3815512} {"current_steps": 5870, "total_steps": 33920, "loss": 0.7297, "lr": 9.838436885929868e-06, "epoch": 3.4610849056603774, "percentage": 17.31, "elapsed_time": "0:10:43", "remaining_time": "0:51:14", "throughput": 5934.55, "total_tokens": 3817816} {"current_steps": 5875, "total_steps": 33920, "loss": 0.363, "lr": 9.837787527855492e-06, "epoch": 3.4640330188679247, "percentage": 17.32, "elapsed_time": "0:10:43", "remaining_time": "0:51:13", "throughput": 5934.35, "total_tokens": 3820568} {"current_steps": 5880, "total_steps": 33920, "loss": 0.4708, "lr": 9.837136888956017e-06, "epoch": 3.4669811320754715, "percentage": 17.33, "elapsed_time": "0:10:44", "remaining_time": "0:51:12", "throughput": 5934.95, "total_tokens": 3824088} {"current_steps": 5885, "total_steps": 33920, "loss": 0.4792, "lr": 9.836484969403705e-06, "epoch": 3.469929245283019, "percentage": 17.35, "elapsed_time": "0:10:44", "remaining_time": "0:51:11", "throughput": 5935.08, "total_tokens": 3827192} {"current_steps": 5890, "total_steps": 33920, "loss": 0.4112, "lr": 9.835831769371152e-06, "epoch": 3.472877358490566, "percentage": 17.36, "elapsed_time": "0:10:45", "remaining_time": "0:51:10", "throughput": 5934.29, "total_tokens": 3829400} {"current_steps": 5895, "total_steps": 33920, "loss": 0.4544, "lr": 9.835177289031298e-06, "epoch": 3.4758254716981134, "percentage": 17.38, "elapsed_time": "0:10:45", "remaining_time": "0:51:09", "throughput": 5933.44, "total_tokens": 3831480} {"current_steps": 5900, "total_steps": 33920, "loss": 0.5183, "lr": 9.834521528557419e-06, "epoch": 3.4787735849056602, "percentage": 17.39, "elapsed_time": "0:10:46", "remaining_time": "0:51:09", "throughput": 5934.02, "total_tokens": 3835032} {"current_steps": 5905, "total_steps": 33920, "loss": 0.3635, "lr": 9.833864488123128e-06, "epoch": 3.4817216981132075, "percentage": 17.41, "elapsed_time": "0:10:46", "remaining_time": "0:51:08", "throughput": 5934.18, "total_tokens": 3838008} {"current_steps": 5910, "total_steps": 33920, "loss": 0.4173, "lr": 9.83320616790238e-06, "epoch": 3.484669811320755, "percentage": 17.42, "elapsed_time": "0:10:47", "remaining_time": "0:51:07", "throughput": 5934.5, "total_tokens": 3841432} {"current_steps": 5915, "total_steps": 33920, "loss": 0.4998, "lr": 9.832546568069472e-06, "epoch": 3.487617924528302, "percentage": 17.44, "elapsed_time": "0:10:47", "remaining_time": "0:51:06", "throughput": 5934.58, "total_tokens": 3844344} {"current_steps": 5920, "total_steps": 33920, "loss": 0.4914, "lr": 9.831885688799031e-06, "epoch": 3.490566037735849, "percentage": 17.45, "elapsed_time": "0:10:48", "remaining_time": "0:51:06", "throughput": 5934.86, "total_tokens": 3847544} {"current_steps": 5925, "total_steps": 33920, "loss": 0.8029, "lr": 9.83122353026603e-06, "epoch": 3.4935141509433962, "percentage": 17.47, "elapsed_time": "0:10:48", "remaining_time": "0:51:05", "throughput": 5934.88, "total_tokens": 3850616} {"current_steps": 5930, "total_steps": 33920, "loss": 0.444, "lr": 9.830560092645778e-06, "epoch": 3.4964622641509435, "percentage": 17.48, "elapsed_time": "0:10:49", "remaining_time": "0:51:05", "throughput": 5935.16, "total_tokens": 3854104} {"current_steps": 5935, "total_steps": 33920, "loss": 0.4993, "lr": 9.829895376113923e-06, "epoch": 3.4994103773584904, "percentage": 17.5, "elapsed_time": "0:10:49", "remaining_time": "0:51:04", "throughput": 5936.09, "total_tokens": 3858296} {"current_steps": 5940, "total_steps": 33920, "loss": 0.4349, "lr": 9.829229380846452e-06, "epoch": 3.5023584905660377, "percentage": 17.51, "elapsed_time": "0:10:50", "remaining_time": "0:51:03", "throughput": 5935.81, "total_tokens": 3860952} {"current_steps": 5945, "total_steps": 33920, "loss": 0.5228, "lr": 9.82856210701969e-06, "epoch": 3.505306603773585, "percentage": 17.53, "elapsed_time": "0:10:50", "remaining_time": "0:51:03", "throughput": 5935.81, "total_tokens": 3863800} {"current_steps": 5950, "total_steps": 33920, "loss": 0.5692, "lr": 9.827893554810298e-06, "epoch": 3.5082547169811322, "percentage": 17.54, "elapsed_time": "0:10:51", "remaining_time": "0:51:02", "throughput": 5936.54, "total_tokens": 3867800} {"current_steps": 5955, "total_steps": 33920, "loss": 0.5173, "lr": 9.827223724395281e-06, "epoch": 3.5112028301886795, "percentage": 17.56, "elapsed_time": "0:10:52", "remaining_time": "0:51:01", "throughput": 5936.09, "total_tokens": 3870360} {"current_steps": 5960, "total_steps": 33920, "loss": 0.4577, "lr": 9.82655261595198e-06, "epoch": 3.5141509433962264, "percentage": 17.57, "elapsed_time": "0:10:52", "remaining_time": "0:51:01", "throughput": 5935.99, "total_tokens": 3873432} {"current_steps": 5965, "total_steps": 33920, "loss": 0.5061, "lr": 9.825880229658073e-06, "epoch": 3.5170990566037736, "percentage": 17.59, "elapsed_time": "0:10:53", "remaining_time": "0:51:00", "throughput": 5936.12, "total_tokens": 3876376} {"current_steps": 5970, "total_steps": 33920, "loss": 0.5066, "lr": 9.825206565691576e-06, "epoch": 3.5200471698113205, "percentage": 17.6, "elapsed_time": "0:10:53", "remaining_time": "0:50:59", "throughput": 5936.3, "total_tokens": 3879352} {"current_steps": 5975, "total_steps": 33920, "loss": 0.4673, "lr": 9.824531624230844e-06, "epoch": 3.5229952830188678, "percentage": 17.61, "elapsed_time": "0:10:54", "remaining_time": "0:50:58", "throughput": 5936.6, "total_tokens": 3882712} {"current_steps": 5980, "total_steps": 33920, "loss": 0.5376, "lr": 9.823855405454573e-06, "epoch": 3.525943396226415, "percentage": 17.63, "elapsed_time": "0:10:54", "remaining_time": "0:50:58", "throughput": 5936.8, "total_tokens": 3886072} {"current_steps": 5985, "total_steps": 33920, "loss": 0.4141, "lr": 9.823177909541795e-06, "epoch": 3.5288915094339623, "percentage": 17.64, "elapsed_time": "0:10:55", "remaining_time": "0:50:57", "throughput": 5936.85, "total_tokens": 3889304} {"current_steps": 5990, "total_steps": 33920, "loss": 0.3906, "lr": 9.822499136671877e-06, "epoch": 3.5318396226415096, "percentage": 17.66, "elapsed_time": "0:10:55", "remaining_time": "0:50:57", "throughput": 5937.11, "total_tokens": 3892600} {"current_steps": 5995, "total_steps": 33920, "loss": 0.4666, "lr": 9.82181908702453e-06, "epoch": 3.5347877358490565, "percentage": 17.67, "elapsed_time": "0:10:56", "remaining_time": "0:50:56", "throughput": 5937.34, "total_tokens": 3895992} {"current_steps": 6000, "total_steps": 33920, "loss": 0.6857, "lr": 9.821137760779797e-06, "epoch": 3.5377358490566038, "percentage": 17.69, "elapsed_time": "0:10:56", "remaining_time": "0:50:55", "throughput": 5937.93, "total_tokens": 3899480} {"current_steps": 6005, "total_steps": 33920, "loss": 0.4807, "lr": 9.820455158118065e-06, "epoch": 3.540683962264151, "percentage": 17.7, "elapsed_time": "0:10:57", "remaining_time": "0:50:54", "throughput": 5937.52, "total_tokens": 3901880} {"current_steps": 6010, "total_steps": 33920, "loss": 0.4873, "lr": 9.819771279220053e-06, "epoch": 3.543632075471698, "percentage": 17.72, "elapsed_time": "0:10:57", "remaining_time": "0:50:55", "throughput": 5938.6, "total_tokens": 3906808} {"current_steps": 6015, "total_steps": 33920, "loss": 0.4121, "lr": 9.819086124266825e-06, "epoch": 3.546580188679245, "percentage": 17.73, "elapsed_time": "0:10:58", "remaining_time": "0:50:54", "throughput": 5938.67, "total_tokens": 3910296} {"current_steps": 6020, "total_steps": 33920, "loss": 0.5161, "lr": 9.818399693439778e-06, "epoch": 3.5495283018867925, "percentage": 17.75, "elapsed_time": "0:10:58", "remaining_time": "0:50:53", "throughput": 5938.85, "total_tokens": 3913400} {"current_steps": 6025, "total_steps": 33920, "loss": 0.4391, "lr": 9.817711986920644e-06, "epoch": 3.5524764150943398, "percentage": 17.76, "elapsed_time": "0:10:59", "remaining_time": "0:50:52", "throughput": 5938.5, "total_tokens": 3915896} {"current_steps": 6030, "total_steps": 33920, "loss": 0.4052, "lr": 9.817023004891497e-06, "epoch": 3.555424528301887, "percentage": 17.78, "elapsed_time": "0:10:59", "remaining_time": "0:50:52", "throughput": 5938.97, "total_tokens": 3919352} {"current_steps": 6035, "total_steps": 33920, "loss": 0.6553, "lr": 9.816332747534752e-06, "epoch": 3.558372641509434, "percentage": 17.79, "elapsed_time": "0:11:00", "remaining_time": "0:50:51", "throughput": 5937.85, "total_tokens": 3921560} {"current_steps": 6040, "total_steps": 33920, "loss": 0.6066, "lr": 9.815641215033153e-06, "epoch": 3.561320754716981, "percentage": 17.81, "elapsed_time": "0:11:00", "remaining_time": "0:50:50", "throughput": 5938.13, "total_tokens": 3924824} {"current_steps": 6045, "total_steps": 33920, "loss": 0.4676, "lr": 9.814948407569789e-06, "epoch": 3.5642688679245285, "percentage": 17.82, "elapsed_time": "0:11:01", "remaining_time": "0:50:50", "throughput": 5938.54, "total_tokens": 3928216} {"current_steps": 6050, "total_steps": 33920, "loss": 0.8209, "lr": 9.814254325328082e-06, "epoch": 3.5672169811320753, "percentage": 17.84, "elapsed_time": "0:11:01", "remaining_time": "0:50:49", "throughput": 5938.65, "total_tokens": 3931192} {"current_steps": 6055, "total_steps": 33920, "loss": 0.3313, "lr": 9.813558968491794e-06, "epoch": 3.5701650943396226, "percentage": 17.85, "elapsed_time": "0:11:02", "remaining_time": "0:50:48", "throughput": 5938.71, "total_tokens": 3934072} {"current_steps": 6060, "total_steps": 33920, "loss": 0.4213, "lr": 9.812862337245024e-06, "epoch": 3.57311320754717, "percentage": 17.87, "elapsed_time": "0:11:02", "remaining_time": "0:50:47", "throughput": 5938.74, "total_tokens": 3937048} {"current_steps": 6065, "total_steps": 33920, "loss": 0.4467, "lr": 9.812164431772208e-06, "epoch": 3.576061320754717, "percentage": 17.88, "elapsed_time": "0:11:03", "remaining_time": "0:50:47", "throughput": 5939.07, "total_tokens": 3940472} {"current_steps": 6070, "total_steps": 33920, "loss": 0.4232, "lr": 9.81146525225812e-06, "epoch": 3.579009433962264, "percentage": 17.9, "elapsed_time": "0:11:03", "remaining_time": "0:50:46", "throughput": 5939.17, "total_tokens": 3943352} {"current_steps": 6075, "total_steps": 33920, "loss": 0.4158, "lr": 9.810764798887868e-06, "epoch": 3.5819575471698113, "percentage": 17.91, "elapsed_time": "0:11:04", "remaining_time": "0:50:46", "throughput": 5940.1, "total_tokens": 3948120} {"current_steps": 6080, "total_steps": 33920, "loss": 0.4391, "lr": 9.810063071846905e-06, "epoch": 3.5849056603773586, "percentage": 17.92, "elapsed_time": "0:11:05", "remaining_time": "0:50:46", "throughput": 5939.91, "total_tokens": 3951640} {"current_steps": 6085, "total_steps": 33920, "loss": 0.5251, "lr": 9.809360071321013e-06, "epoch": 3.5878537735849054, "percentage": 17.94, "elapsed_time": "0:11:05", "remaining_time": "0:50:45", "throughput": 5939.45, "total_tokens": 3954232} {"current_steps": 6090, "total_steps": 33920, "loss": 0.3834, "lr": 9.808655797496314e-06, "epoch": 3.5908018867924527, "percentage": 17.95, "elapsed_time": "0:11:06", "remaining_time": "0:50:44", "throughput": 5939.62, "total_tokens": 3957592} {"current_steps": 6095, "total_steps": 33920, "loss": 0.4787, "lr": 9.807950250559268e-06, "epoch": 3.59375, "percentage": 17.97, "elapsed_time": "0:11:06", "remaining_time": "0:50:43", "throughput": 5939.64, "total_tokens": 3960408} {"current_steps": 6100, "total_steps": 33920, "loss": 0.4039, "lr": 9.807243430696673e-06, "epoch": 3.5966981132075473, "percentage": 17.98, "elapsed_time": "0:11:07", "remaining_time": "0:50:43", "throughput": 5939.94, "total_tokens": 3963768} {"current_steps": 6105, "total_steps": 33920, "loss": 0.3762, "lr": 9.806535338095661e-06, "epoch": 3.5996462264150946, "percentage": 18.0, "elapsed_time": "0:11:07", "remaining_time": "0:50:42", "throughput": 5940.27, "total_tokens": 3967128} {"current_steps": 6110, "total_steps": 33920, "loss": 0.4224, "lr": 9.805825972943706e-06, "epoch": 3.6025943396226414, "percentage": 18.01, "elapsed_time": "0:11:08", "remaining_time": "0:50:41", "throughput": 5939.31, "total_tokens": 3969304} {"current_steps": 6115, "total_steps": 33920, "loss": 0.3702, "lr": 9.80511533542861e-06, "epoch": 3.6055424528301887, "percentage": 18.03, "elapsed_time": "0:11:08", "remaining_time": "0:50:41", "throughput": 5939.03, "total_tokens": 3972024} {"current_steps": 6120, "total_steps": 33920, "loss": 0.4523, "lr": 9.80440342573852e-06, "epoch": 3.608490566037736, "percentage": 18.04, "elapsed_time": "0:11:09", "remaining_time": "0:50:40", "throughput": 5938.97, "total_tokens": 3975032} {"current_steps": 6125, "total_steps": 33920, "loss": 0.4127, "lr": 9.803690244061919e-06, "epoch": 3.611438679245283, "percentage": 18.06, "elapsed_time": "0:11:09", "remaining_time": "0:50:39", "throughput": 5939.01, "total_tokens": 3977944} {"current_steps": 6130, "total_steps": 33920, "loss": 0.4905, "lr": 9.802975790587621e-06, "epoch": 3.61438679245283, "percentage": 18.07, "elapsed_time": "0:11:10", "remaining_time": "0:50:38", "throughput": 5939.44, "total_tokens": 3981304} {"current_steps": 6135, "total_steps": 33920, "loss": 0.5802, "lr": 9.802260065504783e-06, "epoch": 3.6173349056603774, "percentage": 18.09, "elapsed_time": "0:11:10", "remaining_time": "0:50:38", "throughput": 5939.67, "total_tokens": 3984792} {"current_steps": 6140, "total_steps": 33920, "loss": 0.3999, "lr": 9.801543069002897e-06, "epoch": 3.6202830188679247, "percentage": 18.1, "elapsed_time": "0:11:11", "remaining_time": "0:50:37", "throughput": 5939.72, "total_tokens": 3987832} {"current_steps": 6145, "total_steps": 33920, "loss": 0.3942, "lr": 9.80082480127179e-06, "epoch": 3.6232311320754715, "percentage": 18.12, "elapsed_time": "0:11:12", "remaining_time": "0:50:37", "throughput": 5940.02, "total_tokens": 3991800} {"current_steps": 6150, "total_steps": 33920, "loss": 0.4654, "lr": 9.800105262501628e-06, "epoch": 3.626179245283019, "percentage": 18.13, "elapsed_time": "0:11:12", "remaining_time": "0:50:36", "throughput": 5940.39, "total_tokens": 3995096} {"current_steps": 6155, "total_steps": 33920, "loss": 0.479, "lr": 9.799384452882907e-06, "epoch": 3.629127358490566, "percentage": 18.15, "elapsed_time": "0:11:13", "remaining_time": "0:50:35", "throughput": 5940.2, "total_tokens": 3997880} {"current_steps": 6160, "total_steps": 33920, "loss": 0.4028, "lr": 9.798662372606469e-06, "epoch": 3.632075471698113, "percentage": 18.16, "elapsed_time": "0:11:13", "remaining_time": "0:50:35", "throughput": 5940.49, "total_tokens": 4001400} {"current_steps": 6165, "total_steps": 33920, "loss": 0.4583, "lr": 9.797939021863487e-06, "epoch": 3.6350235849056602, "percentage": 18.18, "elapsed_time": "0:11:14", "remaining_time": "0:50:34", "throughput": 5940.39, "total_tokens": 4004344} {"current_steps": 6170, "total_steps": 33920, "loss": 0.6341, "lr": 9.797214400845472e-06, "epoch": 3.6379716981132075, "percentage": 18.19, "elapsed_time": "0:11:14", "remaining_time": "0:50:34", "throughput": 5940.29, "total_tokens": 4007416} {"current_steps": 6175, "total_steps": 33920, "loss": 0.5083, "lr": 9.796488509744269e-06, "epoch": 3.640919811320755, "percentage": 18.2, "elapsed_time": "0:11:15", "remaining_time": "0:50:33", "throughput": 5940.05, "total_tokens": 4010488} {"current_steps": 6180, "total_steps": 33920, "loss": 0.5237, "lr": 9.79576134875206e-06, "epoch": 3.643867924528302, "percentage": 18.22, "elapsed_time": "0:11:15", "remaining_time": "0:50:32", "throughput": 5939.75, "total_tokens": 4013144} {"current_steps": 6185, "total_steps": 33920, "loss": 0.512, "lr": 9.795032918061367e-06, "epoch": 3.646816037735849, "percentage": 18.23, "elapsed_time": "0:11:16", "remaining_time": "0:50:32", "throughput": 5939.63, "total_tokens": 4016312} {"current_steps": 6190, "total_steps": 33920, "loss": 0.5066, "lr": 9.794303217865041e-06, "epoch": 3.6497641509433962, "percentage": 18.25, "elapsed_time": "0:11:16", "remaining_time": "0:50:31", "throughput": 5939.99, "total_tokens": 4019896} {"current_steps": 6195, "total_steps": 33920, "loss": 0.5833, "lr": 9.79357224835628e-06, "epoch": 3.6527122641509435, "percentage": 18.26, "elapsed_time": "0:11:17", "remaining_time": "0:50:30", "throughput": 5940.25, "total_tokens": 4022872} {"current_steps": 6200, "total_steps": 33920, "loss": 0.4617, "lr": 9.792840009728605e-06, "epoch": 3.6556603773584904, "percentage": 18.28, "elapsed_time": "0:11:17", "remaining_time": "0:50:30", "throughput": 5940.36, "total_tokens": 4025912} {"current_steps": 6205, "total_steps": 33920, "loss": 0.4697, "lr": 9.79210650217588e-06, "epoch": 3.6586084905660377, "percentage": 18.29, "elapsed_time": "0:11:18", "remaining_time": "0:50:29", "throughput": 5940.76, "total_tokens": 4029208} {"current_steps": 6210, "total_steps": 33920, "loss": 0.5245, "lr": 9.791371725892307e-06, "epoch": 3.661556603773585, "percentage": 18.31, "elapsed_time": "0:11:18", "remaining_time": "0:50:28", "throughput": 5940.68, "total_tokens": 4032120} {"current_steps": 6215, "total_steps": 33920, "loss": 0.4678, "lr": 9.79063568107242e-06, "epoch": 3.6645047169811322, "percentage": 18.32, "elapsed_time": "0:11:19", "remaining_time": "0:50:28", "throughput": 5940.96, "total_tokens": 4035576} {"current_steps": 6220, "total_steps": 33920, "loss": 0.4948, "lr": 9.78989836791109e-06, "epoch": 3.6674528301886795, "percentage": 18.34, "elapsed_time": "0:11:19", "remaining_time": "0:50:27", "throughput": 5941.28, "total_tokens": 4039096} {"current_steps": 6225, "total_steps": 33920, "loss": 0.4846, "lr": 9.789159786603524e-06, "epoch": 3.6704009433962264, "percentage": 18.35, "elapsed_time": "0:11:20", "remaining_time": "0:50:28", "throughput": 5942.44, "total_tokens": 4045720} {"current_steps": 6230, "total_steps": 33920, "loss": 0.5236, "lr": 9.788419937345263e-06, "epoch": 3.6733490566037736, "percentage": 18.37, "elapsed_time": "0:11:21", "remaining_time": "0:50:28", "throughput": 5942.39, "total_tokens": 4048760} {"current_steps": 6235, "total_steps": 33920, "loss": 0.5792, "lr": 9.787678820332188e-06, "epoch": 3.6762971698113205, "percentage": 18.38, "elapsed_time": "0:11:21", "remaining_time": "0:50:27", "throughput": 5942.57, "total_tokens": 4052408} {"current_steps": 6240, "total_steps": 33920, "loss": 0.3448, "lr": 9.78693643576051e-06, "epoch": 3.6792452830188678, "percentage": 18.4, "elapsed_time": "0:11:22", "remaining_time": "0:50:27", "throughput": 5942.07, "total_tokens": 4054872} {"current_steps": 6245, "total_steps": 33920, "loss": 0.4117, "lr": 9.786192783826782e-06, "epoch": 3.682193396226415, "percentage": 18.41, "elapsed_time": "0:11:22", "remaining_time": "0:50:26", "throughput": 5941.41, "total_tokens": 4057304} {"current_steps": 6250, "total_steps": 33920, "loss": 0.4217, "lr": 9.785447864727887e-06, "epoch": 3.6851415094339623, "percentage": 18.43, "elapsed_time": "0:11:23", "remaining_time": "0:50:25", "throughput": 5941.11, "total_tokens": 4060056} {"current_steps": 6255, "total_steps": 33920, "loss": 0.45, "lr": 9.784701678661045e-06, "epoch": 3.6880896226415096, "percentage": 18.44, "elapsed_time": "0:11:23", "remaining_time": "0:50:24", "throughput": 5940.88, "total_tokens": 4062808} {"current_steps": 6260, "total_steps": 33920, "loss": 0.3605, "lr": 9.783954225823813e-06, "epoch": 3.6910377358490565, "percentage": 18.46, "elapsed_time": "0:11:24", "remaining_time": "0:50:24", "throughput": 5941.31, "total_tokens": 4066360} {"current_steps": 6265, "total_steps": 33920, "loss": 0.6737, "lr": 9.783205506414082e-06, "epoch": 3.6939858490566038, "percentage": 18.47, "elapsed_time": "0:11:25", "remaining_time": "0:50:24", "throughput": 5942.28, "total_tokens": 4071352} {"current_steps": 6270, "total_steps": 33920, "loss": 0.4795, "lr": 9.782455520630079e-06, "epoch": 3.696933962264151, "percentage": 18.48, "elapsed_time": "0:11:25", "remaining_time": "0:50:25", "throughput": 5943.2, "total_tokens": 4076952} {"current_steps": 6275, "total_steps": 33920, "loss": 0.5517, "lr": 9.781704268670364e-06, "epoch": 3.699882075471698, "percentage": 18.5, "elapsed_time": "0:11:26", "remaining_time": "0:50:24", "throughput": 5943.67, "total_tokens": 4080952} {"current_steps": 6280, "total_steps": 33920, "loss": 0.4417, "lr": 9.780951750733837e-06, "epoch": 3.702830188679245, "percentage": 18.51, "elapsed_time": "0:11:27", "remaining_time": "0:50:24", "throughput": 5944.24, "total_tokens": 4084888} {"current_steps": 6285, "total_steps": 33920, "loss": 0.414, "lr": 9.780197967019728e-06, "epoch": 3.7057783018867925, "percentage": 18.53, "elapsed_time": "0:11:27", "remaining_time": "0:50:23", "throughput": 5944.09, "total_tokens": 4087640} {"current_steps": 6290, "total_steps": 33920, "loss": 0.5131, "lr": 9.779442917727608e-06, "epoch": 3.7087264150943398, "percentage": 18.54, "elapsed_time": "0:11:28", "remaining_time": "0:50:22", "throughput": 5944.1, "total_tokens": 4090584} {"current_steps": 6295, "total_steps": 33920, "loss": 0.428, "lr": 9.778686603057377e-06, "epoch": 3.711674528301887, "percentage": 18.56, "elapsed_time": "0:11:29", "remaining_time": "0:50:23", "throughput": 5945.03, "total_tokens": 4096248} {"current_steps": 6300, "total_steps": 33920, "loss": 0.5105, "lr": 9.777929023209271e-06, "epoch": 3.714622641509434, "percentage": 18.57, "elapsed_time": "0:11:29", "remaining_time": "0:50:22", "throughput": 5944.78, "total_tokens": 4099000} {"current_steps": 6305, "total_steps": 33920, "loss": 0.4514, "lr": 9.777170178383866e-06, "epoch": 3.717570754716981, "percentage": 18.59, "elapsed_time": "0:11:30", "remaining_time": "0:50:22", "throughput": 5945.09, "total_tokens": 4102968} {"current_steps": 6310, "total_steps": 33920, "loss": 0.4082, "lr": 9.776410068782068e-06, "epoch": 3.7205188679245285, "percentage": 18.6, "elapsed_time": "0:11:30", "remaining_time": "0:50:22", "throughput": 5945.23, "total_tokens": 4106136} {"current_steps": 6315, "total_steps": 33920, "loss": 0.4888, "lr": 9.775648694605118e-06, "epoch": 3.7234669811320753, "percentage": 18.62, "elapsed_time": "0:11:31", "remaining_time": "0:50:21", "throughput": 5945.47, "total_tokens": 4109912} {"current_steps": 6320, "total_steps": 33920, "loss": 0.5083, "lr": 9.774886056054593e-06, "epoch": 3.7264150943396226, "percentage": 18.63, "elapsed_time": "0:11:31", "remaining_time": "0:50:20", "throughput": 5945.66, "total_tokens": 4112920} {"current_steps": 6325, "total_steps": 33920, "loss": 0.4457, "lr": 9.774122153332408e-06, "epoch": 3.72936320754717, "percentage": 18.65, "elapsed_time": "0:11:32", "remaining_time": "0:50:20", "throughput": 5946.02, "total_tokens": 4116152} {"current_steps": 6330, "total_steps": 33920, "loss": 0.4649, "lr": 9.773356986640807e-06, "epoch": 3.732311320754717, "percentage": 18.66, "elapsed_time": "0:11:32", "remaining_time": "0:50:19", "throughput": 5946.74, "total_tokens": 4120280} {"current_steps": 6335, "total_steps": 33920, "loss": 0.4834, "lr": 9.772590556182373e-06, "epoch": 3.735259433962264, "percentage": 18.68, "elapsed_time": "0:11:33", "remaining_time": "0:50:19", "throughput": 5946.45, "total_tokens": 4122840} {"current_steps": 6340, "total_steps": 33920, "loss": 0.3839, "lr": 9.77182286216002e-06, "epoch": 3.7382075471698113, "percentage": 18.69, "elapsed_time": "0:11:33", "remaining_time": "0:50:18", "throughput": 5946.71, "total_tokens": 4126232} {"current_steps": 6345, "total_steps": 33920, "loss": 0.4966, "lr": 9.771053904776998e-06, "epoch": 3.7411556603773586, "percentage": 18.71, "elapsed_time": "0:11:34", "remaining_time": "0:50:17", "throughput": 5946.98, "total_tokens": 4129752} {"current_steps": 6350, "total_steps": 33920, "loss": 0.7019, "lr": 9.770283684236891e-06, "epoch": 3.7441037735849054, "percentage": 18.72, "elapsed_time": "0:11:34", "remaining_time": "0:50:17", "throughput": 5946.71, "total_tokens": 4132280} {"current_steps": 6355, "total_steps": 33920, "loss": 0.4648, "lr": 9.769512200743623e-06, "epoch": 3.7470518867924527, "percentage": 18.74, "elapsed_time": "0:11:35", "remaining_time": "0:50:16", "throughput": 5946.91, "total_tokens": 4135864} {"current_steps": 6360, "total_steps": 33920, "loss": 0.5098, "lr": 9.768739454501444e-06, "epoch": 3.75, "percentage": 18.75, "elapsed_time": "0:11:35", "remaining_time": "0:50:15", "throughput": 5946.88, "total_tokens": 4138680} {"current_steps": 6365, "total_steps": 33920, "loss": 0.4696, "lr": 9.76796544571494e-06, "epoch": 3.7529481132075473, "percentage": 18.76, "elapsed_time": "0:11:36", "remaining_time": "0:50:14", "throughput": 5946.69, "total_tokens": 4141368} {"current_steps": 6370, "total_steps": 33920, "loss": 0.448, "lr": 9.767190174589036e-06, "epoch": 3.7558962264150946, "percentage": 18.78, "elapsed_time": "0:11:36", "remaining_time": "0:50:14", "throughput": 5947.02, "total_tokens": 4144760} {"current_steps": 6375, "total_steps": 33920, "loss": 0.5654, "lr": 9.76641364132899e-06, "epoch": 3.7588443396226414, "percentage": 18.79, "elapsed_time": "0:11:37", "remaining_time": "0:50:13", "throughput": 5946.58, "total_tokens": 4147416} {"current_steps": 6380, "total_steps": 33920, "loss": 0.483, "lr": 9.765635846140389e-06, "epoch": 3.7617924528301887, "percentage": 18.81, "elapsed_time": "0:11:37", "remaining_time": "0:50:12", "throughput": 5946.52, "total_tokens": 4150328} {"current_steps": 6385, "total_steps": 33920, "loss": 0.4791, "lr": 9.764856789229157e-06, "epoch": 3.764740566037736, "percentage": 18.82, "elapsed_time": "0:11:38", "remaining_time": "0:50:12", "throughput": 5946.77, "total_tokens": 4153528} {"current_steps": 6390, "total_steps": 33920, "loss": 0.3479, "lr": 9.764076470801557e-06, "epoch": 3.767688679245283, "percentage": 18.84, "elapsed_time": "0:11:39", "remaining_time": "0:50:13", "throughput": 5947.7, "total_tokens": 4159896} {"current_steps": 6395, "total_steps": 33920, "loss": 0.4897, "lr": 9.763294891064182e-06, "epoch": 3.77063679245283, "percentage": 18.85, "elapsed_time": "0:11:39", "remaining_time": "0:50:12", "throughput": 5947.84, "total_tokens": 4163160} {"current_steps": 6400, "total_steps": 33920, "loss": 0.5124, "lr": 9.762512050223951e-06, "epoch": 3.7735849056603774, "percentage": 18.87, "elapsed_time": "0:11:40", "remaining_time": "0:50:11", "throughput": 5947.92, "total_tokens": 4166168} {"current_steps": 6405, "total_steps": 33920, "loss": 0.4488, "lr": 9.761727948488132e-06, "epoch": 3.7765330188679247, "percentage": 18.88, "elapsed_time": "0:11:40", "remaining_time": "0:50:11", "throughput": 5947.9, "total_tokens": 4169016} {"current_steps": 6410, "total_steps": 33920, "loss": 0.6208, "lr": 9.760942586064315e-06, "epoch": 3.7794811320754715, "percentage": 18.9, "elapsed_time": "0:11:41", "remaining_time": "0:50:10", "throughput": 5948.24, "total_tokens": 4172248} {"current_steps": 6415, "total_steps": 33920, "loss": 0.4391, "lr": 9.760155963160431e-06, "epoch": 3.782429245283019, "percentage": 18.91, "elapsed_time": "0:11:41", "remaining_time": "0:50:09", "throughput": 5948.29, "total_tokens": 4175000} {"current_steps": 6420, "total_steps": 33920, "loss": 0.5175, "lr": 9.759368079984741e-06, "epoch": 3.785377358490566, "percentage": 18.93, "elapsed_time": "0:11:42", "remaining_time": "0:50:08", "throughput": 5948.39, "total_tokens": 4178168} {"current_steps": 6425, "total_steps": 33920, "loss": 0.5281, "lr": 9.758578936745839e-06, "epoch": 3.788325471698113, "percentage": 18.94, "elapsed_time": "0:11:42", "remaining_time": "0:50:08", "throughput": 5948.81, "total_tokens": 4181688} {"current_steps": 6430, "total_steps": 33920, "loss": 0.4679, "lr": 9.757788533652656e-06, "epoch": 3.7912735849056602, "percentage": 18.96, "elapsed_time": "0:11:43", "remaining_time": "0:50:07", "throughput": 5948.97, "total_tokens": 4184728} {"current_steps": 6435, "total_steps": 33920, "loss": 0.3743, "lr": 9.756996870914454e-06, "epoch": 3.7942216981132075, "percentage": 18.97, "elapsed_time": "0:11:44", "remaining_time": "0:50:06", "throughput": 5949.09, "total_tokens": 4188184} {"current_steps": 6440, "total_steps": 33920, "loss": 0.4798, "lr": 9.756203948740828e-06, "epoch": 3.797169811320755, "percentage": 18.99, "elapsed_time": "0:11:44", "remaining_time": "0:50:05", "throughput": 5948.97, "total_tokens": 4190808} {"current_steps": 6445, "total_steps": 33920, "loss": 0.4782, "lr": 9.755409767341709e-06, "epoch": 3.800117924528302, "percentage": 19.0, "elapsed_time": "0:11:45", "remaining_time": "0:50:05", "throughput": 5949.48, "total_tokens": 4194808} {"current_steps": 6450, "total_steps": 33920, "loss": 0.5435, "lr": 9.75461432692736e-06, "epoch": 3.803066037735849, "percentage": 19.02, "elapsed_time": "0:11:45", "remaining_time": "0:50:04", "throughput": 5949.01, "total_tokens": 4197400} {"current_steps": 6455, "total_steps": 33920, "loss": 0.5429, "lr": 9.753817627708375e-06, "epoch": 3.8060141509433962, "percentage": 19.03, "elapsed_time": "0:11:46", "remaining_time": "0:50:03", "throughput": 5948.51, "total_tokens": 4199736} {"current_steps": 6460, "total_steps": 33920, "loss": 0.598, "lr": 9.753019669895686e-06, "epoch": 3.8089622641509435, "percentage": 19.04, "elapsed_time": "0:11:46", "remaining_time": "0:50:03", "throughput": 5948.68, "total_tokens": 4202680} {"current_steps": 6465, "total_steps": 33920, "loss": 0.5387, "lr": 9.752220453700556e-06, "epoch": 3.8119103773584904, "percentage": 19.06, "elapsed_time": "0:11:47", "remaining_time": "0:50:02", "throughput": 5948.32, "total_tokens": 4205464} {"current_steps": 6470, "total_steps": 33920, "loss": 0.5288, "lr": 9.75141997933458e-06, "epoch": 3.8148584905660377, "percentage": 19.07, "elapsed_time": "0:11:47", "remaining_time": "0:50:01", "throughput": 5948.5, "total_tokens": 4208856} {"current_steps": 6475, "total_steps": 33920, "loss": 0.5233, "lr": 9.750618247009685e-06, "epoch": 3.817806603773585, "percentage": 19.09, "elapsed_time": "0:11:48", "remaining_time": "0:50:01", "throughput": 5949.0, "total_tokens": 4212728} {"current_steps": 6480, "total_steps": 33920, "loss": 0.4468, "lr": 9.749815256938138e-06, "epoch": 3.8207547169811322, "percentage": 19.1, "elapsed_time": "0:11:48", "remaining_time": "0:50:00", "throughput": 5949.3, "total_tokens": 4215960} {"current_steps": 6485, "total_steps": 33920, "loss": 0.3658, "lr": 9.749011009332529e-06, "epoch": 3.8237028301886795, "percentage": 19.12, "elapsed_time": "0:11:49", "remaining_time": "0:50:00", "throughput": 5949.42, "total_tokens": 4219096} {"current_steps": 6490, "total_steps": 33920, "loss": 0.4501, "lr": 9.748205504405787e-06, "epoch": 3.8266509433962264, "percentage": 19.13, "elapsed_time": "0:11:49", "remaining_time": "0:49:59", "throughput": 5949.94, "total_tokens": 4223032} {"current_steps": 6495, "total_steps": 33920, "loss": 0.4556, "lr": 9.747398742371177e-06, "epoch": 3.8295990566037736, "percentage": 19.15, "elapsed_time": "0:11:50", "remaining_time": "0:49:59", "throughput": 5949.06, "total_tokens": 4225656} {"current_steps": 6500, "total_steps": 33920, "loss": 0.4178, "lr": 9.746590723442289e-06, "epoch": 3.8325471698113205, "percentage": 19.16, "elapsed_time": "0:11:50", "remaining_time": "0:49:58", "throughput": 5949.66, "total_tokens": 4229720} {"current_steps": 6505, "total_steps": 33920, "loss": 0.3584, "lr": 9.745781447833049e-06, "epoch": 3.8354952830188678, "percentage": 19.18, "elapsed_time": "0:11:51", "remaining_time": "0:49:58", "throughput": 5949.75, "total_tokens": 4233464} {"current_steps": 6510, "total_steps": 33920, "loss": 0.4143, "lr": 9.74497091575772e-06, "epoch": 3.838443396226415, "percentage": 19.19, "elapsed_time": "0:11:52", "remaining_time": "0:49:57", "throughput": 5949.58, "total_tokens": 4236120} {"current_steps": 6515, "total_steps": 33920, "loss": 0.6568, "lr": 9.744159127430888e-06, "epoch": 3.8413915094339623, "percentage": 19.21, "elapsed_time": "0:11:52", "remaining_time": "0:49:57", "throughput": 5949.95, "total_tokens": 4239448} {"current_steps": 6520, "total_steps": 33920, "loss": 0.3596, "lr": 9.743346083067482e-06, "epoch": 3.8443396226415096, "percentage": 19.22, "elapsed_time": "0:11:53", "remaining_time": "0:49:56", "throughput": 5949.91, "total_tokens": 4242616} {"current_steps": 6525, "total_steps": 33920, "loss": 0.5789, "lr": 9.742531782882758e-06, "epoch": 3.8472877358490565, "percentage": 19.24, "elapsed_time": "0:11:53", "remaining_time": "0:49:56", "throughput": 5949.47, "total_tokens": 4245528} {"current_steps": 6530, "total_steps": 33920, "loss": 0.4895, "lr": 9.741716227092305e-06, "epoch": 3.8502358490566038, "percentage": 19.25, "elapsed_time": "0:11:54", "remaining_time": "0:49:55", "throughput": 5948.77, "total_tokens": 4248120} {"current_steps": 6535, "total_steps": 33920, "loss": 0.5454, "lr": 9.740899415912048e-06, "epoch": 3.853183962264151, "percentage": 19.27, "elapsed_time": "0:11:54", "remaining_time": "0:49:54", "throughput": 5948.39, "total_tokens": 4250808} {"current_steps": 6540, "total_steps": 33920, "loss": 0.4629, "lr": 9.740081349558236e-06, "epoch": 3.856132075471698, "percentage": 19.28, "elapsed_time": "0:11:55", "remaining_time": "0:49:54", "throughput": 5948.67, "total_tokens": 4254328} {"current_steps": 6545, "total_steps": 33920, "loss": 0.6465, "lr": 9.739262028247459e-06, "epoch": 3.859080188679245, "percentage": 19.3, "elapsed_time": "0:11:55", "remaining_time": "0:49:54", "throughput": 5949.97, "total_tokens": 4260024} {"current_steps": 6550, "total_steps": 33920, "loss": 0.3888, "lr": 9.738441452196633e-06, "epoch": 3.8620283018867925, "percentage": 19.31, "elapsed_time": "0:11:56", "remaining_time": "0:49:53", "throughput": 5949.88, "total_tokens": 4262680} {"current_steps": 6555, "total_steps": 33920, "loss": 0.4758, "lr": 9.737619621623013e-06, "epoch": 3.8649764150943398, "percentage": 19.32, "elapsed_time": "0:11:56", "remaining_time": "0:49:53", "throughput": 5949.63, "total_tokens": 4265784} {"current_steps": 6560, "total_steps": 33920, "loss": 0.5636, "lr": 9.73679653674418e-06, "epoch": 3.867924528301887, "percentage": 19.34, "elapsed_time": "0:11:57", "remaining_time": "0:49:52", "throughput": 5949.71, "total_tokens": 4268792} {"current_steps": 6565, "total_steps": 33920, "loss": 0.5459, "lr": 9.735972197778047e-06, "epoch": 3.870872641509434, "percentage": 19.35, "elapsed_time": "0:11:57", "remaining_time": "0:49:51", "throughput": 5949.45, "total_tokens": 4271576} {"current_steps": 6570, "total_steps": 33920, "loss": 0.3232, "lr": 9.735146604942867e-06, "epoch": 3.873820754716981, "percentage": 19.37, "elapsed_time": "0:11:58", "remaining_time": "0:49:50", "throughput": 5949.27, "total_tokens": 4274360} {"current_steps": 6575, "total_steps": 33920, "loss": 0.4813, "lr": 9.734319758457214e-06, "epoch": 3.8767688679245285, "percentage": 19.38, "elapsed_time": "0:11:58", "remaining_time": "0:49:50", "throughput": 5949.09, "total_tokens": 4277144} {"current_steps": 6580, "total_steps": 33920, "loss": 0.4674, "lr": 9.733491658540001e-06, "epoch": 3.8797169811320753, "percentage": 19.4, "elapsed_time": "0:11:59", "remaining_time": "0:49:49", "throughput": 5949.17, "total_tokens": 4280184} {"current_steps": 6585, "total_steps": 33920, "loss": 0.4806, "lr": 9.732662305410474e-06, "epoch": 3.8826650943396226, "percentage": 19.41, "elapsed_time": "0:11:59", "remaining_time": "0:49:48", "throughput": 5948.88, "total_tokens": 4282616} {"current_steps": 6590, "total_steps": 33920, "loss": 0.7064, "lr": 9.731831699288203e-06, "epoch": 3.88561320754717, "percentage": 19.43, "elapsed_time": "0:12:00", "remaining_time": "0:49:47", "throughput": 5949.07, "total_tokens": 4286072} {"current_steps": 6595, "total_steps": 33920, "loss": 0.4256, "lr": 9.730999840393096e-06, "epoch": 3.888561320754717, "percentage": 19.44, "elapsed_time": "0:12:00", "remaining_time": "0:49:47", "throughput": 5949.52, "total_tokens": 4289496} {"current_steps": 6600, "total_steps": 33920, "loss": 0.4116, "lr": 9.730166728945391e-06, "epoch": 3.891509433962264, "percentage": 19.46, "elapsed_time": "0:12:01", "remaining_time": "0:49:46", "throughput": 5949.48, "total_tokens": 4292280} {"current_steps": 6605, "total_steps": 33920, "loss": 0.5178, "lr": 9.72933236516566e-06, "epoch": 3.8944575471698113, "percentage": 19.47, "elapsed_time": "0:12:01", "remaining_time": "0:49:45", "throughput": 5949.23, "total_tokens": 4295096} {"current_steps": 6610, "total_steps": 33920, "loss": 0.434, "lr": 9.728496749274806e-06, "epoch": 3.8974056603773586, "percentage": 19.49, "elapsed_time": "0:12:02", "remaining_time": "0:49:45", "throughput": 5949.97, "total_tokens": 4299288} {"current_steps": 6615, "total_steps": 33920, "loss": 0.5354, "lr": 9.727659881494054e-06, "epoch": 3.9003537735849054, "percentage": 19.5, "elapsed_time": "0:12:03", "remaining_time": "0:49:45", "throughput": 5951.0, "total_tokens": 4304376} {"current_steps": 6620, "total_steps": 33920, "loss": 0.5407, "lr": 9.726821762044975e-06, "epoch": 3.9033018867924527, "percentage": 19.52, "elapsed_time": "0:12:04", "remaining_time": "0:49:45", "throughput": 5952.01, "total_tokens": 4309432} {"current_steps": 6625, "total_steps": 33920, "loss": 0.4264, "lr": 9.725982391149465e-06, "epoch": 3.90625, "percentage": 19.53, "elapsed_time": "0:12:04", "remaining_time": "0:49:45", "throughput": 5952.45, "total_tokens": 4313432} {"current_steps": 6630, "total_steps": 33920, "loss": 0.4589, "lr": 9.725141769029747e-06, "epoch": 3.9091981132075473, "percentage": 19.55, "elapsed_time": "0:12:05", "remaining_time": "0:49:45", "throughput": 5953.17, "total_tokens": 4317464} {"current_steps": 6635, "total_steps": 33920, "loss": 0.4014, "lr": 9.72429989590838e-06, "epoch": 3.9121462264150946, "percentage": 19.56, "elapsed_time": "0:12:05", "remaining_time": "0:49:44", "throughput": 5953.13, "total_tokens": 4320280} {"current_steps": 6640, "total_steps": 33920, "loss": 0.5671, "lr": 9.723456772008257e-06, "epoch": 3.9150943396226414, "percentage": 19.58, "elapsed_time": "0:12:06", "remaining_time": "0:49:43", "throughput": 5953.45, "total_tokens": 4323576} {"current_steps": 6645, "total_steps": 33920, "loss": 0.3822, "lr": 9.722612397552598e-06, "epoch": 3.9180424528301887, "percentage": 19.59, "elapsed_time": "0:12:06", "remaining_time": "0:49:42", "throughput": 5953.58, "total_tokens": 4326616} {"current_steps": 6650, "total_steps": 33920, "loss": 0.5446, "lr": 9.72176677276495e-06, "epoch": 3.920990566037736, "percentage": 19.6, "elapsed_time": "0:12:07", "remaining_time": "0:49:42", "throughput": 5953.71, "total_tokens": 4330168} {"current_steps": 6655, "total_steps": 33920, "loss": 0.4958, "lr": 9.7209198978692e-06, "epoch": 3.923938679245283, "percentage": 19.62, "elapsed_time": "0:12:07", "remaining_time": "0:49:41", "throughput": 5954.09, "total_tokens": 4333464} {"current_steps": 6660, "total_steps": 33920, "loss": 0.6165, "lr": 9.720071773089564e-06, "epoch": 3.92688679245283, "percentage": 19.63, "elapsed_time": "0:12:08", "remaining_time": "0:49:40", "throughput": 5954.32, "total_tokens": 4336504} {"current_steps": 6665, "total_steps": 33920, "loss": 0.4006, "lr": 9.71922239865058e-06, "epoch": 3.9298349056603774, "percentage": 19.65, "elapsed_time": "0:12:08", "remaining_time": "0:49:40", "throughput": 5954.83, "total_tokens": 4340088} {"current_steps": 6670, "total_steps": 33920, "loss": 0.3981, "lr": 9.718371774777131e-06, "epoch": 3.9327830188679247, "percentage": 19.66, "elapsed_time": "0:12:09", "remaining_time": "0:49:40", "throughput": 5955.51, "total_tokens": 4344120} {"current_steps": 6675, "total_steps": 33920, "loss": 0.6055, "lr": 9.717519901694416e-06, "epoch": 3.9357311320754715, "percentage": 19.68, "elapsed_time": "0:12:09", "remaining_time": "0:49:39", "throughput": 5956.17, "total_tokens": 4347928} {"current_steps": 6680, "total_steps": 33920, "loss": 0.5198, "lr": 9.716666779627978e-06, "epoch": 3.938679245283019, "percentage": 19.69, "elapsed_time": "0:12:10", "remaining_time": "0:49:38", "throughput": 5956.24, "total_tokens": 4351192} {"current_steps": 6685, "total_steps": 33920, "loss": 0.4781, "lr": 9.715812408803681e-06, "epoch": 3.941627358490566, "percentage": 19.71, "elapsed_time": "0:12:11", "remaining_time": "0:49:38", "throughput": 5955.63, "total_tokens": 4353592} {"current_steps": 6690, "total_steps": 33920, "loss": 0.4144, "lr": 9.714956789447726e-06, "epoch": 3.944575471698113, "percentage": 19.72, "elapsed_time": "0:12:11", "remaining_time": "0:49:37", "throughput": 5955.78, "total_tokens": 4356632} {"current_steps": 6695, "total_steps": 33920, "loss": 0.3851, "lr": 9.71409992178664e-06, "epoch": 3.9475235849056602, "percentage": 19.74, "elapsed_time": "0:12:11", "remaining_time": "0:49:36", "throughput": 5956.11, "total_tokens": 4359864} {"current_steps": 6700, "total_steps": 33920, "loss": 0.4902, "lr": 9.713241806047282e-06, "epoch": 3.9504716981132075, "percentage": 19.75, "elapsed_time": "0:12:12", "remaining_time": "0:49:36", "throughput": 5956.55, "total_tokens": 4363480} {"current_steps": 6705, "total_steps": 33920, "loss": 0.5751, "lr": 9.712382442456845e-06, "epoch": 3.953419811320755, "percentage": 19.77, "elapsed_time": "0:12:13", "remaining_time": "0:49:35", "throughput": 5957.12, "total_tokens": 4367544} {"current_steps": 6710, "total_steps": 33920, "loss": 0.4691, "lr": 9.711521831242846e-06, "epoch": 3.956367924528302, "percentage": 19.78, "elapsed_time": "0:12:13", "remaining_time": "0:49:35", "throughput": 5957.29, "total_tokens": 4370712} {"current_steps": 6715, "total_steps": 33920, "loss": 0.3743, "lr": 9.710659972633137e-06, "epoch": 3.959316037735849, "percentage": 19.8, "elapsed_time": "0:12:14", "remaining_time": "0:49:34", "throughput": 5957.49, "total_tokens": 4374136} {"current_steps": 6720, "total_steps": 33920, "loss": 0.3075, "lr": 9.709796866855899e-06, "epoch": 3.9622641509433962, "percentage": 19.81, "elapsed_time": "0:12:14", "remaining_time": "0:49:33", "throughput": 5957.49, "total_tokens": 4376984} {"current_steps": 6725, "total_steps": 33920, "loss": 0.5512, "lr": 9.70893251413964e-06, "epoch": 3.9652122641509435, "percentage": 19.83, "elapsed_time": "0:12:15", "remaining_time": "0:49:33", "throughput": 5957.89, "total_tokens": 4380664} {"current_steps": 6730, "total_steps": 33920, "loss": 0.5348, "lr": 9.708066914713205e-06, "epoch": 3.9681603773584904, "percentage": 19.84, "elapsed_time": "0:12:15", "remaining_time": "0:49:32", "throughput": 5958.11, "total_tokens": 4383800} {"current_steps": 6735, "total_steps": 33920, "loss": 0.6916, "lr": 9.707200068805764e-06, "epoch": 3.9711084905660377, "percentage": 19.86, "elapsed_time": "0:12:16", "remaining_time": "0:49:32", "throughput": 5958.56, "total_tokens": 4387576} {"current_steps": 6740, "total_steps": 33920, "loss": 0.3833, "lr": 9.706331976646817e-06, "epoch": 3.974056603773585, "percentage": 19.87, "elapsed_time": "0:12:16", "remaining_time": "0:49:31", "throughput": 5958.89, "total_tokens": 4391224} {"current_steps": 6745, "total_steps": 33920, "loss": 0.4771, "lr": 9.705462638466197e-06, "epoch": 3.9770047169811322, "percentage": 19.89, "elapsed_time": "0:12:17", "remaining_time": "0:49:30", "throughput": 5958.89, "total_tokens": 4394072} {"current_steps": 6750, "total_steps": 33920, "loss": 0.4634, "lr": 9.704592054494065e-06, "epoch": 3.9799528301886795, "percentage": 19.9, "elapsed_time": "0:12:17", "remaining_time": "0:49:30", "throughput": 5959.46, "total_tokens": 4397784} {"current_steps": 6755, "total_steps": 33920, "loss": 0.56, "lr": 9.703720224960909e-06, "epoch": 3.9829009433962264, "percentage": 19.91, "elapsed_time": "0:12:18", "remaining_time": "0:49:29", "throughput": 5959.67, "total_tokens": 4400984} {"current_steps": 6760, "total_steps": 33920, "loss": 0.4941, "lr": 9.702847150097552e-06, "epoch": 3.9858490566037736, "percentage": 19.93, "elapsed_time": "0:12:19", "remaining_time": "0:49:29", "throughput": 5960.19, "total_tokens": 4404760} {"current_steps": 6765, "total_steps": 33920, "loss": 0.5114, "lr": 9.701972830135143e-06, "epoch": 3.9887971698113205, "percentage": 19.94, "elapsed_time": "0:12:19", "remaining_time": "0:49:28", "throughput": 5960.26, "total_tokens": 4407928} {"current_steps": 6770, "total_steps": 33920, "loss": 0.4297, "lr": 9.701097265305164e-06, "epoch": 3.9917452830188678, "percentage": 19.96, "elapsed_time": "0:12:20", "remaining_time": "0:49:27", "throughput": 5960.09, "total_tokens": 4410552} {"current_steps": 6775, "total_steps": 33920, "loss": 0.4422, "lr": 9.700220455839422e-06, "epoch": 3.994693396226415, "percentage": 19.97, "elapsed_time": "0:12:20", "remaining_time": "0:49:27", "throughput": 5960.37, "total_tokens": 4414200} {"current_steps": 6780, "total_steps": 33920, "loss": 0.4471, "lr": 9.69934240197006e-06, "epoch": 3.9976415094339623, "percentage": 19.99, "elapsed_time": "0:12:21", "remaining_time": "0:49:26", "throughput": 5960.63, "total_tokens": 4417528} {"current_steps": 6784, "total_steps": 33920, "eval_loss": 0.5017365217208862, "epoch": 4.0, "percentage": 20.0, "elapsed_time": "0:12:40", "remaining_time": "0:50:42", "throughput": 5810.39, "total_tokens": 4419816} {"current_steps": 6785, "total_steps": 33920, "loss": 0.4823, "lr": 9.698463103929542e-06, "epoch": 4.00058962264151, "percentage": 20.0, "elapsed_time": "0:12:44", "remaining_time": "0:50:55", "throughput": 5785.29, "total_tokens": 4420648} {"current_steps": 6790, "total_steps": 33920, "loss": 0.5052, "lr": 9.697582561950669e-06, "epoch": 4.003537735849057, "percentage": 20.02, "elapsed_time": "0:12:44", "remaining_time": "0:50:55", "throughput": 5786.02, "total_tokens": 4424936} {"current_steps": 6795, "total_steps": 33920, "loss": 0.3518, "lr": 9.696700776266568e-06, "epoch": 4.006485849056604, "percentage": 20.03, "elapsed_time": "0:12:45", "remaining_time": "0:50:55", "throughput": 5786.4, "total_tokens": 4428552} {"current_steps": 6800, "total_steps": 33920, "loss": 0.5587, "lr": 9.695817747110694e-06, "epoch": 4.009433962264151, "percentage": 20.05, "elapsed_time": "0:12:45", "remaining_time": "0:50:54", "throughput": 5786.79, "total_tokens": 4432008} {"current_steps": 6805, "total_steps": 33920, "loss": 0.5803, "lr": 9.694933474716831e-06, "epoch": 4.012382075471698, "percentage": 20.06, "elapsed_time": "0:12:46", "remaining_time": "0:50:53", "throughput": 5786.69, "total_tokens": 4434664} {"current_steps": 6810, "total_steps": 33920, "loss": 0.5447, "lr": 9.6940479593191e-06, "epoch": 4.015330188679245, "percentage": 20.08, "elapsed_time": "0:12:46", "remaining_time": "0:50:52", "throughput": 5786.58, "total_tokens": 4437384} {"current_steps": 6815, "total_steps": 33920, "loss": 0.4246, "lr": 9.693161201151942e-06, "epoch": 4.0182783018867925, "percentage": 20.09, "elapsed_time": "0:12:47", "remaining_time": "0:50:51", "throughput": 5786.1, "total_tokens": 4439816} {"current_steps": 6820, "total_steps": 33920, "loss": 0.5792, "lr": 9.692273200450128e-06, "epoch": 4.02122641509434, "percentage": 20.11, "elapsed_time": "0:12:47", "remaining_time": "0:50:51", "throughput": 5787.06, "total_tokens": 4444392} {"current_steps": 6825, "total_steps": 33920, "loss": 0.4606, "lr": 9.69138395744876e-06, "epoch": 4.024174528301887, "percentage": 20.12, "elapsed_time": "0:12:48", "remaining_time": "0:50:51", "throughput": 5787.33, "total_tokens": 4447784} {"current_steps": 6830, "total_steps": 33920, "loss": 0.454, "lr": 9.690493472383274e-06, "epoch": 4.027122641509434, "percentage": 20.14, "elapsed_time": "0:12:49", "remaining_time": "0:50:50", "throughput": 5787.38, "total_tokens": 4450728} {"current_steps": 6835, "total_steps": 33920, "loss": 0.4411, "lr": 9.689601745489423e-06, "epoch": 4.030070754716981, "percentage": 20.15, "elapsed_time": "0:12:49", "remaining_time": "0:50:49", "throughput": 5788.18, "total_tokens": 4454696} {"current_steps": 6840, "total_steps": 33920, "loss": 0.3798, "lr": 9.6887087770033e-06, "epoch": 4.033018867924528, "percentage": 20.17, "elapsed_time": "0:12:50", "remaining_time": "0:50:49", "throughput": 5788.91, "total_tokens": 4458472} {"current_steps": 6845, "total_steps": 33920, "loss": 0.3346, "lr": 9.687814567161322e-06, "epoch": 4.035966981132075, "percentage": 20.18, "elapsed_time": "0:12:50", "remaining_time": "0:50:48", "throughput": 5788.96, "total_tokens": 4461320} {"current_steps": 6850, "total_steps": 33920, "loss": 0.429, "lr": 9.686919116200232e-06, "epoch": 4.038915094339623, "percentage": 20.19, "elapsed_time": "0:12:51", "remaining_time": "0:50:47", "throughput": 5789.11, "total_tokens": 4464488} {"current_steps": 6855, "total_steps": 33920, "loss": 0.3172, "lr": 9.686022424357108e-06, "epoch": 4.04186320754717, "percentage": 20.21, "elapsed_time": "0:12:51", "remaining_time": "0:50:47", "throughput": 5789.65, "total_tokens": 4468296} {"current_steps": 6860, "total_steps": 33920, "loss": 0.4137, "lr": 9.685124491869353e-06, "epoch": 4.044811320754717, "percentage": 20.22, "elapsed_time": "0:12:52", "remaining_time": "0:50:46", "throughput": 5789.76, "total_tokens": 4471208} {"current_steps": 6865, "total_steps": 33920, "loss": 0.5474, "lr": 9.684225318974696e-06, "epoch": 4.0477594339622645, "percentage": 20.24, "elapsed_time": "0:12:52", "remaining_time": "0:50:45", "throughput": 5789.84, "total_tokens": 4473992} {"current_steps": 6870, "total_steps": 33920, "loss": 0.4243, "lr": 9.683324905911197e-06, "epoch": 4.050707547169812, "percentage": 20.25, "elapsed_time": "0:12:53", "remaining_time": "0:50:44", "throughput": 5790.11, "total_tokens": 4477288} {"current_steps": 6875, "total_steps": 33920, "loss": 0.4147, "lr": 9.682423252917245e-06, "epoch": 4.053655660377358, "percentage": 20.27, "elapsed_time": "0:12:53", "remaining_time": "0:50:44", "throughput": 5790.65, "total_tokens": 4480840} {"current_steps": 6880, "total_steps": 33920, "loss": 0.3714, "lr": 9.681520360231557e-06, "epoch": 4.056603773584905, "percentage": 20.28, "elapsed_time": "0:12:54", "remaining_time": "0:50:43", "throughput": 5791.05, "total_tokens": 4484360} {"current_steps": 6885, "total_steps": 33920, "loss": 0.4868, "lr": 9.680616228093178e-06, "epoch": 4.059551886792453, "percentage": 20.3, "elapsed_time": "0:12:54", "remaining_time": "0:50:42", "throughput": 5791.21, "total_tokens": 4487368} {"current_steps": 6890, "total_steps": 33920, "loss": 0.5315, "lr": 9.67971085674148e-06, "epoch": 4.0625, "percentage": 20.31, "elapsed_time": "0:12:55", "remaining_time": "0:50:42", "throughput": 5791.77, "total_tokens": 4491016} {"current_steps": 6895, "total_steps": 33920, "loss": 0.4361, "lr": 9.678804246416164e-06, "epoch": 4.065448113207547, "percentage": 20.33, "elapsed_time": "0:12:55", "remaining_time": "0:50:41", "throughput": 5792.33, "total_tokens": 4494824} {"current_steps": 6900, "total_steps": 33920, "loss": 0.4544, "lr": 9.677896397357259e-06, "epoch": 4.068396226415095, "percentage": 20.34, "elapsed_time": "0:12:56", "remaining_time": "0:50:40", "throughput": 5792.41, "total_tokens": 4497704} {"current_steps": 6905, "total_steps": 33920, "loss": 0.4551, "lr": 9.676987309805121e-06, "epoch": 4.071344339622642, "percentage": 20.36, "elapsed_time": "0:12:56", "remaining_time": "0:50:39", "throughput": 5792.55, "total_tokens": 4500808} {"current_steps": 6910, "total_steps": 33920, "loss": 0.5567, "lr": 9.67607698400044e-06, "epoch": 4.074292452830188, "percentage": 20.37, "elapsed_time": "0:12:57", "remaining_time": "0:50:39", "throughput": 5793.17, "total_tokens": 4504520} {"current_steps": 6915, "total_steps": 33920, "loss": 0.4292, "lr": 9.67516542018422e-06, "epoch": 4.0772405660377355, "percentage": 20.39, "elapsed_time": "0:12:58", "remaining_time": "0:50:38", "throughput": 5793.1, "total_tokens": 4507400} {"current_steps": 6920, "total_steps": 33920, "loss": 0.4802, "lr": 9.67425261859781e-06, "epoch": 4.080188679245283, "percentage": 20.4, "elapsed_time": "0:12:58", "remaining_time": "0:50:37", "throughput": 5793.31, "total_tokens": 4510536} {"current_steps": 6925, "total_steps": 33920, "loss": 0.4879, "lr": 9.673338579482871e-06, "epoch": 4.08313679245283, "percentage": 20.42, "elapsed_time": "0:12:59", "remaining_time": "0:50:36", "throughput": 5793.53, "total_tokens": 4513608} {"current_steps": 6930, "total_steps": 33920, "loss": 0.4857, "lr": 9.672423303081404e-06, "epoch": 4.086084905660377, "percentage": 20.43, "elapsed_time": "0:12:59", "remaining_time": "0:50:36", "throughput": 5793.77, "total_tokens": 4516744} {"current_steps": 6935, "total_steps": 33920, "loss": 0.4397, "lr": 9.67150678963573e-06, "epoch": 4.089033018867925, "percentage": 20.45, "elapsed_time": "0:13:00", "remaining_time": "0:50:35", "throughput": 5793.89, "total_tokens": 4519976} {"current_steps": 6940, "total_steps": 33920, "loss": 0.3999, "lr": 9.670589039388501e-06, "epoch": 4.091981132075472, "percentage": 20.46, "elapsed_time": "0:13:00", "remaining_time": "0:50:34", "throughput": 5794.06, "total_tokens": 4523016} {"current_steps": 6945, "total_steps": 33920, "loss": 0.342, "lr": 9.669670052582695e-06, "epoch": 4.094929245283019, "percentage": 20.47, "elapsed_time": "0:13:01", "remaining_time": "0:50:34", "throughput": 5794.45, "total_tokens": 4526728} {"current_steps": 6950, "total_steps": 33920, "loss": 0.492, "lr": 9.668749829461617e-06, "epoch": 4.097877358490566, "percentage": 20.49, "elapsed_time": "0:13:01", "remaining_time": "0:50:34", "throughput": 5795.43, "total_tokens": 4531688} {"current_steps": 6955, "total_steps": 33920, "loss": 0.41, "lr": 9.667828370268898e-06, "epoch": 4.100825471698113, "percentage": 20.5, "elapsed_time": "0:13:02", "remaining_time": "0:50:33", "throughput": 5795.5, "total_tokens": 4534632} {"current_steps": 6960, "total_steps": 33920, "loss": 0.3829, "lr": 9.666905675248505e-06, "epoch": 4.10377358490566, "percentage": 20.52, "elapsed_time": "0:13:03", "remaining_time": "0:50:33", "throughput": 5796.09, "total_tokens": 4538376} {"current_steps": 6965, "total_steps": 33920, "loss": 0.4228, "lr": 9.66598174464472e-06, "epoch": 4.1067216981132075, "percentage": 20.53, "elapsed_time": "0:13:03", "remaining_time": "0:50:32", "throughput": 5796.72, "total_tokens": 4542152} {"current_steps": 6970, "total_steps": 33920, "loss": 0.4163, "lr": 9.665056578702157e-06, "epoch": 4.109669811320755, "percentage": 20.55, "elapsed_time": "0:13:04", "remaining_time": "0:50:32", "throughput": 5797.33, "total_tokens": 4546120} {"current_steps": 6975, "total_steps": 33920, "loss": 0.6089, "lr": 9.66413017766576e-06, "epoch": 4.112617924528302, "percentage": 20.56, "elapsed_time": "0:13:04", "remaining_time": "0:50:31", "throughput": 5798.12, "total_tokens": 4550504} {"current_steps": 6980, "total_steps": 33920, "loss": 0.3702, "lr": 9.663202541780799e-06, "epoch": 4.115566037735849, "percentage": 20.58, "elapsed_time": "0:13:05", "remaining_time": "0:50:30", "throughput": 5798.19, "total_tokens": 4553384} {"current_steps": 6985, "total_steps": 33920, "loss": 0.3795, "lr": 9.662273671292866e-06, "epoch": 4.118514150943396, "percentage": 20.59, "elapsed_time": "0:13:05", "remaining_time": "0:50:30", "throughput": 5798.44, "total_tokens": 4556456} {"current_steps": 6990, "total_steps": 33920, "loss": 0.5846, "lr": 9.661343566447886e-06, "epoch": 4.121462264150943, "percentage": 20.61, "elapsed_time": "0:13:06", "remaining_time": "0:50:29", "throughput": 5798.38, "total_tokens": 4559112} {"current_steps": 6995, "total_steps": 33920, "loss": 0.6382, "lr": 9.660412227492107e-06, "epoch": 4.12441037735849, "percentage": 20.62, "elapsed_time": "0:13:06", "remaining_time": "0:50:28", "throughput": 5799.1, "total_tokens": 4563112} {"current_steps": 7000, "total_steps": 33920, "loss": 0.4016, "lr": 9.659479654672106e-06, "epoch": 4.127358490566038, "percentage": 20.64, "elapsed_time": "0:13:07", "remaining_time": "0:50:27", "throughput": 5799.43, "total_tokens": 4566120} {"current_steps": 7005, "total_steps": 33920, "loss": 0.4114, "lr": 9.658545848234784e-06, "epoch": 4.130306603773585, "percentage": 20.65, "elapsed_time": "0:13:07", "remaining_time": "0:50:26", "throughput": 5799.55, "total_tokens": 4568936} {"current_steps": 7010, "total_steps": 33920, "loss": 0.7058, "lr": 9.657610808427372e-06, "epoch": 4.133254716981132, "percentage": 20.67, "elapsed_time": "0:13:08", "remaining_time": "0:50:26", "throughput": 5799.57, "total_tokens": 4571944} {"current_steps": 7015, "total_steps": 33920, "loss": 0.4962, "lr": 9.656674535497425e-06, "epoch": 4.1362028301886795, "percentage": 20.68, "elapsed_time": "0:13:08", "remaining_time": "0:50:25", "throughput": 5800.17, "total_tokens": 4575624} {"current_steps": 7020, "total_steps": 33920, "loss": 0.5222, "lr": 9.655737029692827e-06, "epoch": 4.139150943396227, "percentage": 20.7, "elapsed_time": "0:13:09", "remaining_time": "0:50:24", "throughput": 5800.06, "total_tokens": 4578280} {"current_steps": 7025, "total_steps": 33920, "loss": 0.4279, "lr": 9.654798291261785e-06, "epoch": 4.142099056603773, "percentage": 20.71, "elapsed_time": "0:13:09", "remaining_time": "0:50:24", "throughput": 5800.43, "total_tokens": 4582024} {"current_steps": 7030, "total_steps": 33920, "loss": 0.4952, "lr": 9.653858320452833e-06, "epoch": 4.1450471698113205, "percentage": 20.73, "elapsed_time": "0:13:10", "remaining_time": "0:50:23", "throughput": 5801.25, "total_tokens": 4586344} {"current_steps": 7035, "total_steps": 33920, "loss": 0.3986, "lr": 9.652917117514836e-06, "epoch": 4.147995283018868, "percentage": 20.74, "elapsed_time": "0:13:11", "remaining_time": "0:50:23", "throughput": 5801.32, "total_tokens": 4589576} {"current_steps": 7040, "total_steps": 33920, "loss": 0.3703, "lr": 9.651974682696975e-06, "epoch": 4.150943396226415, "percentage": 20.75, "elapsed_time": "0:13:11", "remaining_time": "0:50:22", "throughput": 5802.1, "total_tokens": 4593736} {"current_steps": 7045, "total_steps": 33920, "loss": 0.5401, "lr": 9.651031016248773e-06, "epoch": 4.153891509433962, "percentage": 20.77, "elapsed_time": "0:13:12", "remaining_time": "0:50:22", "throughput": 5801.61, "total_tokens": 4596072} {"current_steps": 7050, "total_steps": 33920, "loss": 0.3957, "lr": 9.65008611842006e-06, "epoch": 4.15683962264151, "percentage": 20.78, "elapsed_time": "0:13:12", "remaining_time": "0:50:21", "throughput": 5802.14, "total_tokens": 4599528} {"current_steps": 7055, "total_steps": 33920, "loss": 0.5267, "lr": 9.64913998946101e-06, "epoch": 4.159787735849057, "percentage": 20.8, "elapsed_time": "0:13:13", "remaining_time": "0:50:20", "throughput": 5801.68, "total_tokens": 4601736} {"current_steps": 7060, "total_steps": 33920, "loss": 0.4864, "lr": 9.648192629622109e-06, "epoch": 4.162735849056604, "percentage": 20.81, "elapsed_time": "0:13:13", "remaining_time": "0:50:20", "throughput": 5802.56, "total_tokens": 4606088} {"current_steps": 7065, "total_steps": 33920, "loss": 0.452, "lr": 9.647244039154178e-06, "epoch": 4.165683962264151, "percentage": 20.83, "elapsed_time": "0:13:14", "remaining_time": "0:50:19", "throughput": 5802.47, "total_tokens": 4608712} {"current_steps": 7070, "total_steps": 33920, "loss": 0.5189, "lr": 9.64629421830836e-06, "epoch": 4.168632075471698, "percentage": 20.84, "elapsed_time": "0:13:14", "remaining_time": "0:50:18", "throughput": 5802.77, "total_tokens": 4611752} {"current_steps": 7075, "total_steps": 33920, "loss": 0.3933, "lr": 9.64534316733612e-06, "epoch": 4.171580188679245, "percentage": 20.86, "elapsed_time": "0:13:15", "remaining_time": "0:50:17", "throughput": 5802.63, "total_tokens": 4614184} {"current_steps": 7080, "total_steps": 33920, "loss": 0.5269, "lr": 9.644390886489258e-06, "epoch": 4.1745283018867925, "percentage": 20.87, "elapsed_time": "0:13:15", "remaining_time": "0:50:17", "throughput": 5803.51, "total_tokens": 4618856} {"current_steps": 7085, "total_steps": 33920, "loss": 0.5745, "lr": 9.643437376019893e-06, "epoch": 4.17747641509434, "percentage": 20.89, "elapsed_time": "0:13:16", "remaining_time": "0:50:16", "throughput": 5804.17, "total_tokens": 4622568} {"current_steps": 7090, "total_steps": 33920, "loss": 0.4525, "lr": 9.64248263618047e-06, "epoch": 4.180424528301887, "percentage": 20.9, "elapsed_time": "0:13:17", "remaining_time": "0:50:16", "throughput": 5804.61, "total_tokens": 4626856} {"current_steps": 7095, "total_steps": 33920, "loss": 0.4558, "lr": 9.64152666722376e-06, "epoch": 4.183372641509434, "percentage": 20.92, "elapsed_time": "0:13:17", "remaining_time": "0:50:16", "throughput": 5805.42, "total_tokens": 4631048} {"current_steps": 7100, "total_steps": 33920, "loss": 0.4706, "lr": 9.640569469402863e-06, "epoch": 4.186320754716981, "percentage": 20.93, "elapsed_time": "0:13:18", "remaining_time": "0:50:15", "throughput": 5805.72, "total_tokens": 4634088} {"current_steps": 7105, "total_steps": 33920, "loss": 0.4729, "lr": 9.639611042971198e-06, "epoch": 4.189268867924528, "percentage": 20.95, "elapsed_time": "0:13:18", "remaining_time": "0:50:14", "throughput": 5806.31, "total_tokens": 4638056} {"current_steps": 7110, "total_steps": 33920, "loss": 0.5465, "lr": 9.638651388182514e-06, "epoch": 4.192216981132075, "percentage": 20.96, "elapsed_time": "0:13:19", "remaining_time": "0:50:13", "throughput": 5806.35, "total_tokens": 4640744} {"current_steps": 7115, "total_steps": 33920, "loss": 0.5278, "lr": 9.637690505290884e-06, "epoch": 4.195165094339623, "percentage": 20.98, "elapsed_time": "0:13:19", "remaining_time": "0:50:13", "throughput": 5805.99, "total_tokens": 4643432} {"current_steps": 7120, "total_steps": 33920, "loss": 0.473, "lr": 9.636728394550705e-06, "epoch": 4.19811320754717, "percentage": 20.99, "elapsed_time": "0:13:20", "remaining_time": "0:50:12", "throughput": 5805.92, "total_tokens": 4646184} {"current_steps": 7125, "total_steps": 33920, "loss": 0.4971, "lr": 9.6357650562167e-06, "epoch": 4.201061320754717, "percentage": 21.01, "elapsed_time": "0:13:20", "remaining_time": "0:50:11", "throughput": 5806.01, "total_tokens": 4649064} {"current_steps": 7130, "total_steps": 33920, "loss": 0.4081, "lr": 9.634800490543918e-06, "epoch": 4.2040094339622645, "percentage": 21.02, "elapsed_time": "0:13:21", "remaining_time": "0:50:10", "throughput": 5806.32, "total_tokens": 4652360} {"current_steps": 7135, "total_steps": 33920, "loss": 0.4657, "lr": 9.633834697787731e-06, "epoch": 4.206957547169812, "percentage": 21.03, "elapsed_time": "0:13:21", "remaining_time": "0:50:09", "throughput": 5806.17, "total_tokens": 4655080} {"current_steps": 7140, "total_steps": 33920, "loss": 0.519, "lr": 9.632867678203836e-06, "epoch": 4.209905660377358, "percentage": 21.05, "elapsed_time": "0:13:22", "remaining_time": "0:50:08", "throughput": 5805.54, "total_tokens": 4657384} {"current_steps": 7145, "total_steps": 33920, "loss": 0.3374, "lr": 9.631899432048258e-06, "epoch": 4.212853773584905, "percentage": 21.06, "elapsed_time": "0:13:22", "remaining_time": "0:50:08", "throughput": 5805.65, "total_tokens": 4660296} {"current_steps": 7150, "total_steps": 33920, "loss": 0.5037, "lr": 9.630929959577343e-06, "epoch": 4.215801886792453, "percentage": 21.08, "elapsed_time": "0:13:23", "remaining_time": "0:50:07", "throughput": 5806.42, "total_tokens": 4664360} {"current_steps": 7155, "total_steps": 33920, "loss": 0.448, "lr": 9.629959261047764e-06, "epoch": 4.21875, "percentage": 21.09, "elapsed_time": "0:13:23", "remaining_time": "0:50:07", "throughput": 5807.1, "total_tokens": 4668360} {"current_steps": 7160, "total_steps": 33920, "loss": 0.5411, "lr": 9.628987336716513e-06, "epoch": 4.221698113207547, "percentage": 21.11, "elapsed_time": "0:13:24", "remaining_time": "0:50:06", "throughput": 5807.37, "total_tokens": 4671528} {"current_steps": 7165, "total_steps": 33920, "loss": 0.4886, "lr": 9.628014186840918e-06, "epoch": 4.224646226415095, "percentage": 21.12, "elapsed_time": "0:13:24", "remaining_time": "0:50:05", "throughput": 5807.58, "total_tokens": 4675016} {"current_steps": 7170, "total_steps": 33920, "loss": 0.4901, "lr": 9.62703981167862e-06, "epoch": 4.227594339622642, "percentage": 21.14, "elapsed_time": "0:13:25", "remaining_time": "0:50:05", "throughput": 5807.43, "total_tokens": 4677768} {"current_steps": 7175, "total_steps": 33920, "loss": 0.4378, "lr": 9.626064211487592e-06, "epoch": 4.230542452830188, "percentage": 21.15, "elapsed_time": "0:13:26", "remaining_time": "0:50:04", "throughput": 5807.76, "total_tokens": 4681064} {"current_steps": 7180, "total_steps": 33920, "loss": 0.5005, "lr": 9.625087386526125e-06, "epoch": 4.2334905660377355, "percentage": 21.17, "elapsed_time": "0:13:26", "remaining_time": "0:50:03", "throughput": 5807.53, "total_tokens": 4683784} {"current_steps": 7185, "total_steps": 33920, "loss": 0.4803, "lr": 9.624109337052839e-06, "epoch": 4.236438679245283, "percentage": 21.18, "elapsed_time": "0:13:27", "remaining_time": "0:50:03", "throughput": 5807.47, "total_tokens": 4687080} {"current_steps": 7190, "total_steps": 33920, "loss": 0.4852, "lr": 9.623130063326678e-06, "epoch": 4.23938679245283, "percentage": 21.2, "elapsed_time": "0:13:27", "remaining_time": "0:50:02", "throughput": 5807.13, "total_tokens": 4689544} {"current_steps": 7195, "total_steps": 33920, "loss": 0.4812, "lr": 9.622149565606909e-06, "epoch": 4.242334905660377, "percentage": 21.21, "elapsed_time": "0:13:28", "remaining_time": "0:50:01", "throughput": 5807.92, "total_tokens": 4693640} {"current_steps": 7200, "total_steps": 33920, "loss": 0.4102, "lr": 9.621167844153122e-06, "epoch": 4.245283018867925, "percentage": 21.23, "elapsed_time": "0:13:28", "remaining_time": "0:50:00", "throughput": 5808.11, "total_tokens": 4696616} {"current_steps": 7205, "total_steps": 33920, "loss": 0.557, "lr": 9.620184899225231e-06, "epoch": 4.248231132075472, "percentage": 21.24, "elapsed_time": "0:13:29", "remaining_time": "0:50:00", "throughput": 5808.86, "total_tokens": 4700904} {"current_steps": 7210, "total_steps": 33920, "loss": 0.507, "lr": 9.619200731083477e-06, "epoch": 4.251179245283019, "percentage": 21.26, "elapsed_time": "0:13:29", "remaining_time": "0:49:59", "throughput": 5809.02, "total_tokens": 4703912} {"current_steps": 7215, "total_steps": 33920, "loss": 0.6216, "lr": 9.618215339988422e-06, "epoch": 4.254127358490566, "percentage": 21.27, "elapsed_time": "0:13:30", "remaining_time": "0:49:59", "throughput": 5809.32, "total_tokens": 4707048} {"current_steps": 7220, "total_steps": 33920, "loss": 0.4979, "lr": 9.617228726200951e-06, "epoch": 4.257075471698113, "percentage": 21.29, "elapsed_time": "0:13:30", "remaining_time": "0:49:58", "throughput": 5809.69, "total_tokens": 4710312} {"current_steps": 7225, "total_steps": 33920, "loss": 0.384, "lr": 9.616240889982277e-06, "epoch": 4.26002358490566, "percentage": 21.3, "elapsed_time": "0:13:31", "remaining_time": "0:49:57", "throughput": 5809.94, "total_tokens": 4713384} {"current_steps": 7230, "total_steps": 33920, "loss": 0.4548, "lr": 9.61525183159393e-06, "epoch": 4.2629716981132075, "percentage": 21.31, "elapsed_time": "0:13:31", "remaining_time": "0:49:56", "throughput": 5810.13, "total_tokens": 4716168} {"current_steps": 7235, "total_steps": 33920, "loss": 0.3812, "lr": 9.614261551297774e-06, "epoch": 4.265919811320755, "percentage": 21.33, "elapsed_time": "0:13:32", "remaining_time": "0:49:55", "throughput": 5810.45, "total_tokens": 4719368} {"current_steps": 7240, "total_steps": 33920, "loss": 0.4746, "lr": 9.613270049355983e-06, "epoch": 4.268867924528302, "percentage": 21.34, "elapsed_time": "0:13:32", "remaining_time": "0:49:54", "throughput": 5810.74, "total_tokens": 4722536} {"current_steps": 7245, "total_steps": 33920, "loss": 0.4638, "lr": 9.612277326031065e-06, "epoch": 4.271816037735849, "percentage": 21.36, "elapsed_time": "0:13:33", "remaining_time": "0:49:54", "throughput": 5811.08, "total_tokens": 4726056} {"current_steps": 7250, "total_steps": 33920, "loss": 0.4333, "lr": 9.611283381585848e-06, "epoch": 4.274764150943396, "percentage": 21.37, "elapsed_time": "0:13:33", "remaining_time": "0:49:53", "throughput": 5810.99, "total_tokens": 4728712} {"current_steps": 7255, "total_steps": 33920, "loss": 0.4202, "lr": 9.61028821628348e-06, "epoch": 4.277712264150943, "percentage": 21.39, "elapsed_time": "0:13:34", "remaining_time": "0:49:52", "throughput": 5811.56, "total_tokens": 4732328} {"current_steps": 7260, "total_steps": 33920, "loss": 0.7485, "lr": 9.609291830387439e-06, "epoch": 4.28066037735849, "percentage": 21.4, "elapsed_time": "0:13:34", "remaining_time": "0:49:52", "throughput": 5811.66, "total_tokens": 4735240} {"current_steps": 7265, "total_steps": 33920, "loss": 0.3855, "lr": 9.608294224161523e-06, "epoch": 4.283608490566038, "percentage": 21.42, "elapsed_time": "0:13:35", "remaining_time": "0:49:51", "throughput": 5812.31, "total_tokens": 4739112} {"current_steps": 7270, "total_steps": 33920, "loss": 0.5807, "lr": 9.607295397869847e-06, "epoch": 4.286556603773585, "percentage": 21.43, "elapsed_time": "0:13:35", "remaining_time": "0:49:50", "throughput": 5812.03, "total_tokens": 4741640} {"current_steps": 7275, "total_steps": 33920, "loss": 0.5031, "lr": 9.60629535177686e-06, "epoch": 4.289504716981132, "percentage": 21.45, "elapsed_time": "0:13:36", "remaining_time": "0:49:49", "throughput": 5811.89, "total_tokens": 4744104} {"current_steps": 7280, "total_steps": 33920, "loss": 0.6573, "lr": 9.605294086147325e-06, "epoch": 4.2924528301886795, "percentage": 21.46, "elapsed_time": "0:13:36", "remaining_time": "0:49:49", "throughput": 5812.49, "total_tokens": 4747880} {"current_steps": 7285, "total_steps": 33920, "loss": 0.5157, "lr": 9.604291601246333e-06, "epoch": 4.295400943396227, "percentage": 21.48, "elapsed_time": "0:13:37", "remaining_time": "0:49:48", "throughput": 5812.41, "total_tokens": 4750728} {"current_steps": 7290, "total_steps": 33920, "loss": 0.3689, "lr": 9.603287897339299e-06, "epoch": 4.298349056603773, "percentage": 21.49, "elapsed_time": "0:13:37", "remaining_time": "0:49:47", "throughput": 5812.6, "total_tokens": 4754088} {"current_steps": 7295, "total_steps": 33920, "loss": 0.3235, "lr": 9.602282974691953e-06, "epoch": 4.3012971698113205, "percentage": 21.51, "elapsed_time": "0:13:38", "remaining_time": "0:49:47", "throughput": 5812.67, "total_tokens": 4757256} {"current_steps": 7300, "total_steps": 33920, "loss": 0.5108, "lr": 9.601276833570355e-06, "epoch": 4.304245283018868, "percentage": 21.52, "elapsed_time": "0:13:38", "remaining_time": "0:49:46", "throughput": 5812.86, "total_tokens": 4760264} {"current_steps": 7305, "total_steps": 33920, "loss": 0.3417, "lr": 9.600269474240885e-06, "epoch": 4.307193396226415, "percentage": 21.54, "elapsed_time": "0:13:39", "remaining_time": "0:49:45", "throughput": 5812.23, "total_tokens": 4762440} {"current_steps": 7310, "total_steps": 33920, "loss": 0.6009, "lr": 9.599260896970246e-06, "epoch": 4.310141509433962, "percentage": 21.55, "elapsed_time": "0:13:40", "remaining_time": "0:49:45", "throughput": 5812.71, "total_tokens": 4766600} {"current_steps": 7315, "total_steps": 33920, "loss": 0.3808, "lr": 9.598251102025463e-06, "epoch": 4.31308962264151, "percentage": 21.57, "elapsed_time": "0:13:40", "remaining_time": "0:49:44", "throughput": 5812.32, "total_tokens": 4769320} {"current_steps": 7320, "total_steps": 33920, "loss": 0.5002, "lr": 9.597240089673882e-06, "epoch": 4.316037735849057, "percentage": 21.58, "elapsed_time": "0:13:41", "remaining_time": "0:49:43", "throughput": 5812.34, "total_tokens": 4772136} {"current_steps": 7325, "total_steps": 33920, "loss": 0.4178, "lr": 9.596227860183175e-06, "epoch": 4.318985849056604, "percentage": 21.59, "elapsed_time": "0:13:41", "remaining_time": "0:49:42", "throughput": 5812.38, "total_tokens": 4774920} {"current_steps": 7330, "total_steps": 33920, "loss": 0.3371, "lr": 9.595214413821334e-06, "epoch": 4.321933962264151, "percentage": 21.61, "elapsed_time": "0:13:42", "remaining_time": "0:49:42", "throughput": 5812.61, "total_tokens": 4778632} {"current_steps": 7335, "total_steps": 33920, "loss": 0.5201, "lr": 9.59419975085667e-06, "epoch": 4.324882075471698, "percentage": 21.62, "elapsed_time": "0:13:42", "remaining_time": "0:49:41", "throughput": 5813.18, "total_tokens": 4782248} {"current_steps": 7340, "total_steps": 33920, "loss": 0.4916, "lr": 9.593183871557826e-06, "epoch": 4.327830188679245, "percentage": 21.64, "elapsed_time": "0:13:43", "remaining_time": "0:49:40", "throughput": 5813.27, "total_tokens": 4785256} {"current_steps": 7345, "total_steps": 33920, "loss": 0.3618, "lr": 9.592166776193754e-06, "epoch": 4.3307783018867925, "percentage": 21.65, "elapsed_time": "0:13:43", "remaining_time": "0:49:40", "throughput": 5813.28, "total_tokens": 4788360} {"current_steps": 7350, "total_steps": 33920, "loss": 0.4221, "lr": 9.591148465033738e-06, "epoch": 4.33372641509434, "percentage": 21.67, "elapsed_time": "0:13:44", "remaining_time": "0:49:39", "throughput": 5813.6, "total_tokens": 4791848} {"current_steps": 7355, "total_steps": 33920, "loss": 0.4216, "lr": 9.590128938347378e-06, "epoch": 4.336674528301887, "percentage": 21.68, "elapsed_time": "0:13:44", "remaining_time": "0:49:38", "throughput": 5813.59, "total_tokens": 4794760} {"current_steps": 7360, "total_steps": 33920, "loss": 0.4328, "lr": 9.589108196404599e-06, "epoch": 4.339622641509434, "percentage": 21.7, "elapsed_time": "0:13:45", "remaining_time": "0:49:38", "throughput": 5813.37, "total_tokens": 4797608} {"current_steps": 7365, "total_steps": 33920, "loss": 0.4152, "lr": 9.588086239475649e-06, "epoch": 4.342570754716981, "percentage": 21.71, "elapsed_time": "0:13:45", "remaining_time": "0:49:37", "throughput": 5813.82, "total_tokens": 4801224} {"current_steps": 7370, "total_steps": 33920, "loss": 0.4721, "lr": 9.587063067831092e-06, "epoch": 4.345518867924528, "percentage": 21.73, "elapsed_time": "0:13:46", "remaining_time": "0:49:36", "throughput": 5814.08, "total_tokens": 4804488} {"current_steps": 7375, "total_steps": 33920, "loss": 0.4086, "lr": 9.586038681741818e-06, "epoch": 4.348466981132075, "percentage": 21.74, "elapsed_time": "0:13:46", "remaining_time": "0:49:36", "throughput": 5813.62, "total_tokens": 4806984} {"current_steps": 7380, "total_steps": 33920, "loss": 0.6139, "lr": 9.58501308147904e-06, "epoch": 4.351415094339623, "percentage": 21.76, "elapsed_time": "0:13:47", "remaining_time": "0:49:35", "throughput": 5813.94, "total_tokens": 4810280} {"current_steps": 7385, "total_steps": 33920, "loss": 0.4688, "lr": 9.583986267314288e-06, "epoch": 4.35436320754717, "percentage": 21.77, "elapsed_time": "0:13:47", "remaining_time": "0:49:34", "throughput": 5813.85, "total_tokens": 4813320} {"current_steps": 7390, "total_steps": 33920, "loss": 0.5089, "lr": 9.582958239519416e-06, "epoch": 4.357311320754717, "percentage": 21.79, "elapsed_time": "0:13:48", "remaining_time": "0:49:33", "throughput": 5813.92, "total_tokens": 4816296} {"current_steps": 7395, "total_steps": 33920, "loss": 0.5664, "lr": 9.581928998366597e-06, "epoch": 4.3602594339622645, "percentage": 21.8, "elapsed_time": "0:13:48", "remaining_time": "0:49:33", "throughput": 5813.96, "total_tokens": 4819176} {"current_steps": 7400, "total_steps": 33920, "loss": 0.3879, "lr": 9.58089854412833e-06, "epoch": 4.363207547169811, "percentage": 21.82, "elapsed_time": "0:13:49", "remaining_time": "0:49:32", "throughput": 5814.28, "total_tokens": 4822632} {"current_steps": 7405, "total_steps": 33920, "loss": 0.475, "lr": 9.579866877077431e-06, "epoch": 4.366155660377358, "percentage": 21.83, "elapsed_time": "0:13:49", "remaining_time": "0:49:31", "throughput": 5814.24, "total_tokens": 4825480} {"current_steps": 7410, "total_steps": 33920, "loss": 0.4442, "lr": 9.578833997487038e-06, "epoch": 4.369103773584905, "percentage": 21.85, "elapsed_time": "0:13:50", "remaining_time": "0:49:31", "throughput": 5814.48, "total_tokens": 4828712} {"current_steps": 7415, "total_steps": 33920, "loss": 0.418, "lr": 9.57779990563061e-06, "epoch": 4.372051886792453, "percentage": 21.86, "elapsed_time": "0:13:50", "remaining_time": "0:49:30", "throughput": 5814.74, "total_tokens": 4831944} {"current_steps": 7420, "total_steps": 33920, "loss": 0.413, "lr": 9.576764601781928e-06, "epoch": 4.375, "percentage": 21.88, "elapsed_time": "0:13:51", "remaining_time": "0:49:29", "throughput": 5815.01, "total_tokens": 4835528} {"current_steps": 7425, "total_steps": 33920, "loss": 0.4642, "lr": 9.575728086215093e-06, "epoch": 4.377948113207547, "percentage": 21.89, "elapsed_time": "0:13:52", "remaining_time": "0:49:29", "throughput": 5814.65, "total_tokens": 4838152} {"current_steps": 7430, "total_steps": 33920, "loss": 0.5152, "lr": 9.574690359204527e-06, "epoch": 4.380896226415095, "percentage": 21.9, "elapsed_time": "0:13:52", "remaining_time": "0:49:28", "throughput": 5814.21, "total_tokens": 4840520} {"current_steps": 7435, "total_steps": 33920, "loss": 0.3794, "lr": 9.573651421024972e-06, "epoch": 4.383844339622642, "percentage": 21.92, "elapsed_time": "0:13:53", "remaining_time": "0:49:28", "throughput": 5814.92, "total_tokens": 4845064} {"current_steps": 7440, "total_steps": 33920, "loss": 0.5777, "lr": 9.572611271951494e-06, "epoch": 4.386792452830189, "percentage": 21.93, "elapsed_time": "0:13:53", "remaining_time": "0:49:27", "throughput": 5814.57, "total_tokens": 4847464} {"current_steps": 7445, "total_steps": 33920, "loss": 0.5316, "lr": 9.571569912259473e-06, "epoch": 4.3897405660377355, "percentage": 21.95, "elapsed_time": "0:13:54", "remaining_time": "0:49:26", "throughput": 5814.71, "total_tokens": 4850728} {"current_steps": 7450, "total_steps": 33920, "loss": 0.4438, "lr": 9.570527342224614e-06, "epoch": 4.392688679245283, "percentage": 21.96, "elapsed_time": "0:13:54", "remaining_time": "0:49:26", "throughput": 5815.06, "total_tokens": 4854440} {"current_steps": 7455, "total_steps": 33920, "loss": 0.499, "lr": 9.569483562122945e-06, "epoch": 4.39563679245283, "percentage": 21.98, "elapsed_time": "0:13:55", "remaining_time": "0:49:25", "throughput": 5815.46, "total_tokens": 4857960} {"current_steps": 7460, "total_steps": 33920, "loss": 0.3592, "lr": 9.568438572230811e-06, "epoch": 4.398584905660377, "percentage": 21.99, "elapsed_time": "0:13:55", "remaining_time": "0:49:24", "throughput": 5815.34, "total_tokens": 4860840} {"current_steps": 7465, "total_steps": 33920, "loss": 0.4627, "lr": 9.567392372824873e-06, "epoch": 4.401533018867925, "percentage": 22.01, "elapsed_time": "0:13:56", "remaining_time": "0:49:23", "throughput": 5814.91, "total_tokens": 4863240} {"current_steps": 7470, "total_steps": 33920, "loss": 0.4864, "lr": 9.566344964182123e-06, "epoch": 4.404481132075472, "percentage": 22.02, "elapsed_time": "0:13:56", "remaining_time": "0:49:23", "throughput": 5815.11, "total_tokens": 4866248} {"current_steps": 7475, "total_steps": 33920, "loss": 0.3894, "lr": 9.565296346579862e-06, "epoch": 4.407429245283019, "percentage": 22.04, "elapsed_time": "0:13:57", "remaining_time": "0:49:22", "throughput": 5814.96, "total_tokens": 4869256} {"current_steps": 7480, "total_steps": 33920, "loss": 0.5238, "lr": 9.564246520295719e-06, "epoch": 4.410377358490566, "percentage": 22.05, "elapsed_time": "0:13:57", "remaining_time": "0:49:21", "throughput": 5814.91, "total_tokens": 4871912} {"current_steps": 7485, "total_steps": 33920, "loss": 0.4309, "lr": 9.563195485607638e-06, "epoch": 4.413325471698113, "percentage": 22.07, "elapsed_time": "0:13:58", "remaining_time": "0:49:21", "throughput": 5815.19, "total_tokens": 4875944} {"current_steps": 7490, "total_steps": 33920, "loss": 0.4546, "lr": 9.562143242793885e-06, "epoch": 4.41627358490566, "percentage": 22.08, "elapsed_time": "0:13:58", "remaining_time": "0:49:20", "throughput": 5814.48, "total_tokens": 4878280} {"current_steps": 7495, "total_steps": 33920, "loss": 0.4125, "lr": 9.561089792133048e-06, "epoch": 4.4192216981132075, "percentage": 22.1, "elapsed_time": "0:13:59", "remaining_time": "0:49:19", "throughput": 5814.77, "total_tokens": 4881352} {"current_steps": 7500, "total_steps": 33920, "loss": 0.499, "lr": 9.560035133904031e-06, "epoch": 4.422169811320755, "percentage": 22.11, "elapsed_time": "0:14:00", "remaining_time": "0:49:19", "throughput": 5815.22, "total_tokens": 4884808} {"current_steps": 7505, "total_steps": 33920, "loss": 0.4404, "lr": 9.55897926838606e-06, "epoch": 4.425117924528302, "percentage": 22.13, "elapsed_time": "0:14:00", "remaining_time": "0:49:18", "throughput": 5815.53, "total_tokens": 4888040} {"current_steps": 7510, "total_steps": 33920, "loss": 0.4059, "lr": 9.55792219585868e-06, "epoch": 4.428066037735849, "percentage": 22.14, "elapsed_time": "0:14:01", "remaining_time": "0:49:17", "throughput": 5815.62, "total_tokens": 4891144} {"current_steps": 7515, "total_steps": 33920, "loss": 0.4684, "lr": 9.556863916601754e-06, "epoch": 4.431014150943396, "percentage": 22.16, "elapsed_time": "0:14:01", "remaining_time": "0:49:16", "throughput": 5815.84, "total_tokens": 4894344} {"current_steps": 7520, "total_steps": 33920, "loss": 0.5369, "lr": 9.555804430895467e-06, "epoch": 4.433962264150943, "percentage": 22.17, "elapsed_time": "0:14:02", "remaining_time": "0:49:16", "throughput": 5816.01, "total_tokens": 4897352} {"current_steps": 7525, "total_steps": 33920, "loss": 0.3056, "lr": 9.554743739020325e-06, "epoch": 4.43691037735849, "percentage": 22.18, "elapsed_time": "0:14:02", "remaining_time": "0:49:15", "throughput": 5815.65, "total_tokens": 4900040} {"current_steps": 7530, "total_steps": 33920, "loss": 0.5413, "lr": 9.553681841257146e-06, "epoch": 4.439858490566038, "percentage": 22.2, "elapsed_time": "0:14:03", "remaining_time": "0:49:14", "throughput": 5815.98, "total_tokens": 4903560} {"current_steps": 7535, "total_steps": 33920, "loss": 0.4726, "lr": 9.552618737887073e-06, "epoch": 4.442806603773585, "percentage": 22.21, "elapsed_time": "0:14:03", "remaining_time": "0:49:14", "throughput": 5816.29, "total_tokens": 4907496} {"current_steps": 7540, "total_steps": 33920, "loss": 0.5243, "lr": 9.55155442919157e-06, "epoch": 4.445754716981132, "percentage": 22.23, "elapsed_time": "0:14:04", "remaining_time": "0:49:13", "throughput": 5816.04, "total_tokens": 4910376} {"current_steps": 7545, "total_steps": 33920, "loss": 0.4509, "lr": 9.550488915452416e-06, "epoch": 4.4487028301886795, "percentage": 22.24, "elapsed_time": "0:14:04", "remaining_time": "0:49:13", "throughput": 5816.26, "total_tokens": 4913512} {"current_steps": 7550, "total_steps": 33920, "loss": 0.5485, "lr": 9.54942219695171e-06, "epoch": 4.451650943396227, "percentage": 22.26, "elapsed_time": "0:14:05", "remaining_time": "0:49:12", "throughput": 5816.13, "total_tokens": 4916264} {"current_steps": 7555, "total_steps": 33920, "loss": 0.4777, "lr": 9.54835427397187e-06, "epoch": 4.454599056603773, "percentage": 22.27, "elapsed_time": "0:14:05", "remaining_time": "0:49:11", "throughput": 5816.61, "total_tokens": 4920200} {"current_steps": 7560, "total_steps": 33920, "loss": 0.5433, "lr": 9.547285146795634e-06, "epoch": 4.4575471698113205, "percentage": 22.29, "elapsed_time": "0:14:06", "remaining_time": "0:49:11", "throughput": 5816.68, "total_tokens": 4923304} {"current_steps": 7565, "total_steps": 33920, "loss": 0.5329, "lr": 9.546214815706059e-06, "epoch": 4.460495283018868, "percentage": 22.3, "elapsed_time": "0:14:06", "remaining_time": "0:49:10", "throughput": 5816.74, "total_tokens": 4926312} {"current_steps": 7570, "total_steps": 33920, "loss": 0.3715, "lr": 9.545143280986518e-06, "epoch": 4.463443396226415, "percentage": 22.32, "elapsed_time": "0:14:07", "remaining_time": "0:49:10", "throughput": 5817.22, "total_tokens": 4930280} {"current_steps": 7575, "total_steps": 33920, "loss": 0.5294, "lr": 9.544070542920703e-06, "epoch": 4.466391509433962, "percentage": 22.33, "elapsed_time": "0:14:08", "remaining_time": "0:49:09", "throughput": 5817.62, "total_tokens": 4934024} {"current_steps": 7580, "total_steps": 33920, "loss": 0.552, "lr": 9.542996601792629e-06, "epoch": 4.46933962264151, "percentage": 22.35, "elapsed_time": "0:14:08", "remaining_time": "0:49:08", "throughput": 5817.61, "total_tokens": 4937096} {"current_steps": 7585, "total_steps": 33920, "loss": 0.5132, "lr": 9.541921457886624e-06, "epoch": 4.472287735849057, "percentage": 22.36, "elapsed_time": "0:14:09", "remaining_time": "0:49:08", "throughput": 5817.54, "total_tokens": 4939848} {"current_steps": 7590, "total_steps": 33920, "loss": 0.4083, "lr": 9.54084511148734e-06, "epoch": 4.475235849056604, "percentage": 22.38, "elapsed_time": "0:14:09", "remaining_time": "0:49:07", "throughput": 5817.65, "total_tokens": 4942696} {"current_steps": 7595, "total_steps": 33920, "loss": 0.4343, "lr": 9.539767562879742e-06, "epoch": 4.478183962264151, "percentage": 22.39, "elapsed_time": "0:14:10", "remaining_time": "0:49:06", "throughput": 5817.6, "total_tokens": 4945704} {"current_steps": 7600, "total_steps": 33920, "loss": 0.5065, "lr": 9.538688812349118e-06, "epoch": 4.481132075471698, "percentage": 22.41, "elapsed_time": "0:14:10", "remaining_time": "0:49:05", "throughput": 5817.5, "total_tokens": 4948680} {"current_steps": 7605, "total_steps": 33920, "loss": 0.437, "lr": 9.537608860181069e-06, "epoch": 4.484080188679245, "percentage": 22.42, "elapsed_time": "0:14:11", "remaining_time": "0:49:05", "throughput": 5817.41, "total_tokens": 4951688} {"current_steps": 7610, "total_steps": 33920, "loss": 0.5244, "lr": 9.536527706661519e-06, "epoch": 4.4870283018867925, "percentage": 22.44, "elapsed_time": "0:14:11", "remaining_time": "0:49:04", "throughput": 5818.06, "total_tokens": 4955752} {"current_steps": 7615, "total_steps": 33920, "loss": 0.3742, "lr": 9.535445352076707e-06, "epoch": 4.48997641509434, "percentage": 22.45, "elapsed_time": "0:14:12", "remaining_time": "0:49:04", "throughput": 5818.18, "total_tokens": 4958888} {"current_steps": 7620, "total_steps": 33920, "loss": 0.4895, "lr": 9.534361796713191e-06, "epoch": 4.492924528301887, "percentage": 22.46, "elapsed_time": "0:14:12", "remaining_time": "0:49:03", "throughput": 5818.36, "total_tokens": 4961992} {"current_steps": 7625, "total_steps": 33920, "loss": 0.4034, "lr": 9.533277040857847e-06, "epoch": 4.495872641509434, "percentage": 22.48, "elapsed_time": "0:14:13", "remaining_time": "0:49:02", "throughput": 5818.31, "total_tokens": 4964616} {"current_steps": 7630, "total_steps": 33920, "loss": 0.3751, "lr": 9.53219108479787e-06, "epoch": 4.498820754716981, "percentage": 22.49, "elapsed_time": "0:14:13", "remaining_time": "0:49:01", "throughput": 5818.66, "total_tokens": 4967912} {"current_steps": 7635, "total_steps": 33920, "loss": 0.2893, "lr": 9.53110392882077e-06, "epoch": 4.501768867924528, "percentage": 22.51, "elapsed_time": "0:14:14", "remaining_time": "0:49:00", "throughput": 5818.17, "total_tokens": 4970280} {"current_steps": 7640, "total_steps": 33920, "loss": 0.467, "lr": 9.530015573214378e-06, "epoch": 4.504716981132075, "percentage": 22.52, "elapsed_time": "0:14:14", "remaining_time": "0:49:00", "throughput": 5818.13, "total_tokens": 4973224} {"current_steps": 7645, "total_steps": 33920, "loss": 0.5468, "lr": 9.528926018266837e-06, "epoch": 4.507665094339623, "percentage": 22.54, "elapsed_time": "0:14:15", "remaining_time": "0:48:59", "throughput": 5818.56, "total_tokens": 4976808} {"current_steps": 7650, "total_steps": 33920, "loss": 0.5315, "lr": 9.527835264266617e-06, "epoch": 4.51061320754717, "percentage": 22.55, "elapsed_time": "0:14:16", "remaining_time": "0:48:59", "throughput": 5819.77, "total_tokens": 4982312} {"current_steps": 7655, "total_steps": 33920, "loss": 0.4115, "lr": 9.526743311502496e-06, "epoch": 4.513561320754717, "percentage": 22.57, "elapsed_time": "0:14:16", "remaining_time": "0:48:58", "throughput": 5819.5, "total_tokens": 4984744} {"current_steps": 7660, "total_steps": 33920, "loss": 0.4663, "lr": 9.525650160263573e-06, "epoch": 4.5165094339622645, "percentage": 22.58, "elapsed_time": "0:14:17", "remaining_time": "0:48:58", "throughput": 5819.84, "total_tokens": 4987816} {"current_steps": 7665, "total_steps": 33920, "loss": 0.5458, "lr": 9.524555810839267e-06, "epoch": 4.519457547169811, "percentage": 22.6, "elapsed_time": "0:14:17", "remaining_time": "0:48:57", "throughput": 5819.98, "total_tokens": 4990856} {"current_steps": 7670, "total_steps": 33920, "loss": 0.3345, "lr": 9.523460263519309e-06, "epoch": 4.522405660377358, "percentage": 22.61, "elapsed_time": "0:14:18", "remaining_time": "0:48:56", "throughput": 5819.66, "total_tokens": 4993384} {"current_steps": 7675, "total_steps": 33920, "loss": 0.4313, "lr": 9.522363518593753e-06, "epoch": 4.525353773584905, "percentage": 22.63, "elapsed_time": "0:14:18", "remaining_time": "0:48:55", "throughput": 5820.09, "total_tokens": 4996872} {"current_steps": 7680, "total_steps": 33920, "loss": 0.4791, "lr": 9.521265576352963e-06, "epoch": 4.528301886792453, "percentage": 22.64, "elapsed_time": "0:14:19", "remaining_time": "0:48:55", "throughput": 5819.65, "total_tokens": 4999304} {"current_steps": 7685, "total_steps": 33920, "loss": 0.5386, "lr": 9.520166437087628e-06, "epoch": 4.53125, "percentage": 22.66, "elapsed_time": "0:14:19", "remaining_time": "0:48:54", "throughput": 5819.9, "total_tokens": 5002760} {"current_steps": 7690, "total_steps": 33920, "loss": 0.3854, "lr": 9.519066101088748e-06, "epoch": 4.534198113207547, "percentage": 22.67, "elapsed_time": "0:14:20", "remaining_time": "0:48:53", "throughput": 5819.89, "total_tokens": 5005704} {"current_steps": 7695, "total_steps": 33920, "loss": 0.3951, "lr": 9.51796456864764e-06, "epoch": 4.537146226415095, "percentage": 22.69, "elapsed_time": "0:14:20", "remaining_time": "0:48:52", "throughput": 5819.97, "total_tokens": 5008616} {"current_steps": 7700, "total_steps": 33920, "loss": 0.4036, "lr": 9.516861840055942e-06, "epoch": 4.540094339622642, "percentage": 22.7, "elapsed_time": "0:14:21", "remaining_time": "0:48:52", "throughput": 5819.98, "total_tokens": 5011624} {"current_steps": 7705, "total_steps": 33920, "loss": 0.5455, "lr": 9.515757915605604e-06, "epoch": 4.543042452830189, "percentage": 22.72, "elapsed_time": "0:14:21", "remaining_time": "0:48:51", "throughput": 5820.12, "total_tokens": 5014760} {"current_steps": 7710, "total_steps": 33920, "loss": 0.4415, "lr": 9.514652795588899e-06, "epoch": 4.5459905660377355, "percentage": 22.73, "elapsed_time": "0:14:22", "remaining_time": "0:48:50", "throughput": 5820.52, "total_tokens": 5018184} {"current_steps": 7715, "total_steps": 33920, "loss": 0.5423, "lr": 9.513546480298405e-06, "epoch": 4.548938679245283, "percentage": 22.74, "elapsed_time": "0:14:22", "remaining_time": "0:48:50", "throughput": 5820.82, "total_tokens": 5021448} {"current_steps": 7720, "total_steps": 33920, "loss": 0.4206, "lr": 9.512438970027032e-06, "epoch": 4.55188679245283, "percentage": 22.76, "elapsed_time": "0:14:23", "remaining_time": "0:48:49", "throughput": 5820.86, "total_tokens": 5024456} {"current_steps": 7725, "total_steps": 33920, "loss": 0.4736, "lr": 9.511330265067992e-06, "epoch": 4.554834905660377, "percentage": 22.77, "elapsed_time": "0:14:23", "remaining_time": "0:48:48", "throughput": 5820.41, "total_tokens": 5026792} {"current_steps": 7730, "total_steps": 33920, "loss": 0.3369, "lr": 9.510220365714822e-06, "epoch": 4.557783018867925, "percentage": 22.79, "elapsed_time": "0:14:24", "remaining_time": "0:48:47", "throughput": 5820.11, "total_tokens": 5029128} {"current_steps": 7735, "total_steps": 33920, "loss": 0.3452, "lr": 9.509109272261373e-06, "epoch": 4.560731132075472, "percentage": 22.8, "elapsed_time": "0:14:24", "remaining_time": "0:48:47", "throughput": 5820.83, "total_tokens": 5033064} {"current_steps": 7740, "total_steps": 33920, "loss": 0.3933, "lr": 9.50799698500181e-06, "epoch": 4.563679245283019, "percentage": 22.82, "elapsed_time": "0:14:25", "remaining_time": "0:48:46", "throughput": 5821.07, "total_tokens": 5036392} {"current_steps": 7745, "total_steps": 33920, "loss": 0.4035, "lr": 9.506883504230618e-06, "epoch": 4.566627358490566, "percentage": 22.83, "elapsed_time": "0:14:25", "remaining_time": "0:48:45", "throughput": 5821.7, "total_tokens": 5040296} {"current_steps": 7750, "total_steps": 33920, "loss": 0.4266, "lr": 9.505768830242593e-06, "epoch": 4.569575471698113, "percentage": 22.85, "elapsed_time": "0:14:26", "remaining_time": "0:48:45", "throughput": 5822.14, "total_tokens": 5043688} {"current_steps": 7755, "total_steps": 33920, "loss": 0.489, "lr": 9.504652963332852e-06, "epoch": 4.57252358490566, "percentage": 22.86, "elapsed_time": "0:14:26", "remaining_time": "0:48:44", "throughput": 5821.96, "total_tokens": 5046152} {"current_steps": 7760, "total_steps": 33920, "loss": 0.496, "lr": 9.503535903796825e-06, "epoch": 4.5754716981132075, "percentage": 22.88, "elapsed_time": "0:14:27", "remaining_time": "0:48:43", "throughput": 5821.08, "total_tokens": 5048360} {"current_steps": 7765, "total_steps": 33920, "loss": 0.3689, "lr": 9.50241765193026e-06, "epoch": 4.578419811320755, "percentage": 22.89, "elapsed_time": "0:14:27", "remaining_time": "0:48:42", "throughput": 5820.86, "total_tokens": 5051112} {"current_steps": 7770, "total_steps": 33920, "loss": 0.4181, "lr": 9.501298208029214e-06, "epoch": 4.581367924528302, "percentage": 22.91, "elapsed_time": "0:14:28", "remaining_time": "0:48:42", "throughput": 5820.47, "total_tokens": 5053480} {"current_steps": 7775, "total_steps": 33920, "loss": 0.3971, "lr": 9.500177572390071e-06, "epoch": 4.584316037735849, "percentage": 22.92, "elapsed_time": "0:14:28", "remaining_time": "0:48:41", "throughput": 5820.74, "total_tokens": 5057000} {"current_steps": 7780, "total_steps": 33920, "loss": 0.4833, "lr": 9.49905574530952e-06, "epoch": 4.587264150943396, "percentage": 22.94, "elapsed_time": "0:14:29", "remaining_time": "0:48:40", "throughput": 5820.84, "total_tokens": 5060072} {"current_steps": 7785, "total_steps": 33920, "loss": 0.626, "lr": 9.497932727084571e-06, "epoch": 4.590212264150943, "percentage": 22.95, "elapsed_time": "0:14:29", "remaining_time": "0:48:39", "throughput": 5820.57, "total_tokens": 5062568} {"current_steps": 7790, "total_steps": 33920, "loss": 0.4124, "lr": 9.496808518012545e-06, "epoch": 4.59316037735849, "percentage": 22.97, "elapsed_time": "0:14:30", "remaining_time": "0:48:39", "throughput": 5821.25, "total_tokens": 5066600} {"current_steps": 7795, "total_steps": 33920, "loss": 0.4609, "lr": 9.495683118391087e-06, "epoch": 4.596108490566038, "percentage": 22.98, "elapsed_time": "0:14:30", "remaining_time": "0:48:38", "throughput": 5821.25, "total_tokens": 5069384} {"current_steps": 7800, "total_steps": 33920, "loss": 0.4144, "lr": 9.494556528518146e-06, "epoch": 4.599056603773585, "percentage": 23.0, "elapsed_time": "0:14:31", "remaining_time": "0:48:37", "throughput": 5821.45, "total_tokens": 5072520} {"current_steps": 7805, "total_steps": 33920, "loss": 0.5683, "lr": 9.493428748691995e-06, "epoch": 4.602004716981132, "percentage": 23.01, "elapsed_time": "0:14:31", "remaining_time": "0:48:37", "throughput": 5821.19, "total_tokens": 5075208} {"current_steps": 7810, "total_steps": 33920, "loss": 0.3866, "lr": 9.492299779211215e-06, "epoch": 4.6049528301886795, "percentage": 23.02, "elapsed_time": "0:14:32", "remaining_time": "0:48:36", "throughput": 5821.2, "total_tokens": 5077992} {"current_steps": 7815, "total_steps": 33920, "loss": 0.6076, "lr": 9.49116962037471e-06, "epoch": 4.607900943396227, "percentage": 23.04, "elapsed_time": "0:14:32", "remaining_time": "0:48:35", "throughput": 5820.85, "total_tokens": 5080456} {"current_steps": 7820, "total_steps": 33920, "loss": 0.4501, "lr": 9.490038272481691e-06, "epoch": 4.610849056603773, "percentage": 23.05, "elapsed_time": "0:14:33", "remaining_time": "0:48:34", "throughput": 5821.25, "total_tokens": 5084168} {"current_steps": 7825, "total_steps": 33920, "loss": 0.492, "lr": 9.488905735831689e-06, "epoch": 4.6137971698113205, "percentage": 23.07, "elapsed_time": "0:14:33", "remaining_time": "0:48:34", "throughput": 5821.18, "total_tokens": 5086824} {"current_steps": 7830, "total_steps": 33920, "loss": 0.3705, "lr": 9.487772010724548e-06, "epoch": 4.616745283018868, "percentage": 23.08, "elapsed_time": "0:14:34", "remaining_time": "0:48:33", "throughput": 5821.41, "total_tokens": 5089928} {"current_steps": 7835, "total_steps": 33920, "loss": 0.3599, "lr": 9.486637097460425e-06, "epoch": 4.619693396226415, "percentage": 23.1, "elapsed_time": "0:14:34", "remaining_time": "0:48:32", "throughput": 5822.12, "total_tokens": 5093928} {"current_steps": 7840, "total_steps": 33920, "loss": 0.404, "lr": 9.485500996339793e-06, "epoch": 4.622641509433962, "percentage": 23.11, "elapsed_time": "0:14:35", "remaining_time": "0:48:32", "throughput": 5822.1, "total_tokens": 5096680} {"current_steps": 7845, "total_steps": 33920, "loss": 0.4298, "lr": 9.484363707663443e-06, "epoch": 4.62558962264151, "percentage": 23.13, "elapsed_time": "0:14:35", "remaining_time": "0:48:31", "throughput": 5822.2, "total_tokens": 5099496} {"current_steps": 7850, "total_steps": 33920, "loss": 0.5356, "lr": 9.483225231732474e-06, "epoch": 4.628537735849057, "percentage": 23.14, "elapsed_time": "0:14:36", "remaining_time": "0:48:30", "throughput": 5822.08, "total_tokens": 5102472} {"current_steps": 7855, "total_steps": 33920, "loss": 0.4106, "lr": 9.482085568848302e-06, "epoch": 4.631485849056604, "percentage": 23.16, "elapsed_time": "0:14:36", "remaining_time": "0:48:29", "throughput": 5822.42, "total_tokens": 5105768} {"current_steps": 7860, "total_steps": 33920, "loss": 0.6216, "lr": 9.480944719312659e-06, "epoch": 4.634433962264151, "percentage": 23.17, "elapsed_time": "0:14:37", "remaining_time": "0:48:29", "throughput": 5822.8, "total_tokens": 5109224} {"current_steps": 7865, "total_steps": 33920, "loss": 0.5203, "lr": 9.47980268342759e-06, "epoch": 4.637382075471698, "percentage": 23.19, "elapsed_time": "0:14:38", "remaining_time": "0:48:28", "throughput": 5822.74, "total_tokens": 5112392} {"current_steps": 7870, "total_steps": 33920, "loss": 0.4738, "lr": 9.478659461495456e-06, "epoch": 4.640330188679245, "percentage": 23.2, "elapsed_time": "0:14:38", "remaining_time": "0:48:27", "throughput": 5821.82, "total_tokens": 5114376} {"current_steps": 7875, "total_steps": 33920, "loss": 0.4424, "lr": 9.477515053818926e-06, "epoch": 4.6432783018867925, "percentage": 23.22, "elapsed_time": "0:14:39", "remaining_time": "0:48:27", "throughput": 5822.57, "total_tokens": 5118536} {"current_steps": 7880, "total_steps": 33920, "loss": 0.4267, "lr": 9.476369460700988e-06, "epoch": 4.64622641509434, "percentage": 23.23, "elapsed_time": "0:14:39", "remaining_time": "0:48:26", "throughput": 5822.75, "total_tokens": 5121736} {"current_steps": 7885, "total_steps": 33920, "loss": 0.4979, "lr": 9.475222682444944e-06, "epoch": 4.649174528301887, "percentage": 23.25, "elapsed_time": "0:14:40", "remaining_time": "0:48:25", "throughput": 5822.74, "total_tokens": 5124520} {"current_steps": 7890, "total_steps": 33920, "loss": 0.4655, "lr": 9.474074719354406e-06, "epoch": 4.652122641509434, "percentage": 23.26, "elapsed_time": "0:14:40", "remaining_time": "0:48:25", "throughput": 5823.11, "total_tokens": 5127912} {"current_steps": 7895, "total_steps": 33920, "loss": 0.4555, "lr": 9.472925571733306e-06, "epoch": 4.655070754716981, "percentage": 23.28, "elapsed_time": "0:14:41", "remaining_time": "0:48:24", "throughput": 5823.12, "total_tokens": 5130824} {"current_steps": 7900, "total_steps": 33920, "loss": 0.4919, "lr": 9.471775239885883e-06, "epoch": 4.658018867924528, "percentage": 23.29, "elapsed_time": "0:14:41", "remaining_time": "0:48:23", "throughput": 5823.39, "total_tokens": 5134024} {"current_steps": 7905, "total_steps": 33920, "loss": 0.4143, "lr": 9.470623724116693e-06, "epoch": 4.660966981132075, "percentage": 23.3, "elapsed_time": "0:14:42", "remaining_time": "0:48:23", "throughput": 5823.98, "total_tokens": 5137672} {"current_steps": 7910, "total_steps": 33920, "loss": 0.4364, "lr": 9.469471024730606e-06, "epoch": 4.663915094339623, "percentage": 23.32, "elapsed_time": "0:14:42", "remaining_time": "0:48:22", "throughput": 5824.44, "total_tokens": 5141480} {"current_steps": 7915, "total_steps": 33920, "loss": 0.5073, "lr": 9.4683171420328e-06, "epoch": 4.66686320754717, "percentage": 23.33, "elapsed_time": "0:14:43", "remaining_time": "0:48:22", "throughput": 5824.95, "total_tokens": 5145800} {"current_steps": 7920, "total_steps": 33920, "loss": 0.4013, "lr": 9.467162076328776e-06, "epoch": 4.669811320754717, "percentage": 23.35, "elapsed_time": "0:14:43", "remaining_time": "0:48:21", "throughput": 5825.18, "total_tokens": 5149320} {"current_steps": 7925, "total_steps": 33920, "loss": 0.5339, "lr": 9.466005827924337e-06, "epoch": 4.6727594339622645, "percentage": 23.36, "elapsed_time": "0:14:44", "remaining_time": "0:48:21", "throughput": 5825.02, "total_tokens": 5152072} {"current_steps": 7930, "total_steps": 33920, "loss": 0.6446, "lr": 9.46484839712561e-06, "epoch": 4.675707547169811, "percentage": 23.38, "elapsed_time": "0:14:44", "remaining_time": "0:48:20", "throughput": 5825.26, "total_tokens": 5155304} {"current_steps": 7935, "total_steps": 33920, "loss": 0.4136, "lr": 9.463689784239026e-06, "epoch": 4.678655660377358, "percentage": 23.39, "elapsed_time": "0:14:45", "remaining_time": "0:48:19", "throughput": 5825.23, "total_tokens": 5158216} {"current_steps": 7940, "total_steps": 33920, "loss": 0.4616, "lr": 9.462529989571334e-06, "epoch": 4.681603773584905, "percentage": 23.41, "elapsed_time": "0:14:46", "remaining_time": "0:48:19", "throughput": 5825.75, "total_tokens": 5161896} {"current_steps": 7945, "total_steps": 33920, "loss": 0.5737, "lr": 9.461369013429595e-06, "epoch": 4.684551886792453, "percentage": 23.42, "elapsed_time": "0:14:46", "remaining_time": "0:48:19", "throughput": 5826.51, "total_tokens": 5167880} {"current_steps": 7950, "total_steps": 33920, "loss": 0.5744, "lr": 9.460206856121183e-06, "epoch": 4.6875, "percentage": 23.44, "elapsed_time": "0:14:47", "remaining_time": "0:48:19", "throughput": 5826.87, "total_tokens": 5171112} {"current_steps": 7955, "total_steps": 33920, "loss": 0.4463, "lr": 9.459043517953786e-06, "epoch": 4.690448113207547, "percentage": 23.45, "elapsed_time": "0:14:48", "remaining_time": "0:48:18", "throughput": 5827.46, "total_tokens": 5174920} {"current_steps": 7960, "total_steps": 33920, "loss": 0.4516, "lr": 9.457878999235396e-06, "epoch": 4.693396226415095, "percentage": 23.47, "elapsed_time": "0:14:48", "remaining_time": "0:48:17", "throughput": 5827.8, "total_tokens": 5178088} {"current_steps": 7965, "total_steps": 33920, "loss": 0.6278, "lr": 9.45671330027433e-06, "epoch": 4.696344339622642, "percentage": 23.48, "elapsed_time": "0:14:49", "remaining_time": "0:48:17", "throughput": 5828.2, "total_tokens": 5181448} {"current_steps": 7970, "total_steps": 33920, "loss": 0.4615, "lr": 9.45554642137921e-06, "epoch": 4.699292452830189, "percentage": 23.5, "elapsed_time": "0:14:49", "remaining_time": "0:48:16", "throughput": 5828.08, "total_tokens": 5183976} {"current_steps": 7975, "total_steps": 33920, "loss": 0.37, "lr": 9.454378362858974e-06, "epoch": 4.7022405660377355, "percentage": 23.51, "elapsed_time": "0:14:50", "remaining_time": "0:48:15", "throughput": 5828.64, "total_tokens": 5187688} {"current_steps": 7980, "total_steps": 33920, "loss": 0.6165, "lr": 9.453209125022867e-06, "epoch": 4.705188679245283, "percentage": 23.53, "elapsed_time": "0:14:50", "remaining_time": "0:48:14", "throughput": 5828.64, "total_tokens": 5190504} {"current_steps": 7985, "total_steps": 33920, "loss": 0.4526, "lr": 9.452038708180453e-06, "epoch": 4.70813679245283, "percentage": 23.54, "elapsed_time": "0:14:50", "remaining_time": "0:48:13", "throughput": 5828.59, "total_tokens": 5193032} {"current_steps": 7990, "total_steps": 33920, "loss": 0.4659, "lr": 9.450867112641603e-06, "epoch": 4.711084905660377, "percentage": 23.56, "elapsed_time": "0:14:51", "remaining_time": "0:48:13", "throughput": 5829.09, "total_tokens": 5196968} {"current_steps": 7995, "total_steps": 33920, "loss": 0.4777, "lr": 9.449694338716506e-06, "epoch": 4.714033018867925, "percentage": 23.57, "elapsed_time": "0:14:52", "remaining_time": "0:48:12", "throughput": 5829.05, "total_tokens": 5199848} {"current_steps": 8000, "total_steps": 33920, "loss": 0.4135, "lr": 9.448520386715653e-06, "epoch": 4.716981132075472, "percentage": 23.58, "elapsed_time": "0:14:52", "remaining_time": "0:48:12", "throughput": 5829.77, "total_tokens": 5204040} {"current_steps": 8005, "total_steps": 33920, "loss": 0.3828, "lr": 9.447345256949855e-06, "epoch": 4.719929245283019, "percentage": 23.6, "elapsed_time": "0:14:53", "remaining_time": "0:48:11", "throughput": 5830.15, "total_tokens": 5207240} {"current_steps": 8010, "total_steps": 33920, "loss": 0.5591, "lr": 9.446168949730234e-06, "epoch": 4.722877358490566, "percentage": 23.61, "elapsed_time": "0:14:53", "remaining_time": "0:48:10", "throughput": 5830.33, "total_tokens": 5210312} {"current_steps": 8015, "total_steps": 33920, "loss": 0.4712, "lr": 9.444991465368223e-06, "epoch": 4.725825471698113, "percentage": 23.63, "elapsed_time": "0:14:54", "remaining_time": "0:48:10", "throughput": 5831.16, "total_tokens": 5214760} {"current_steps": 8020, "total_steps": 33920, "loss": 0.5624, "lr": 9.443812804175562e-06, "epoch": 4.72877358490566, "percentage": 23.64, "elapsed_time": "0:14:54", "remaining_time": "0:48:09", "throughput": 5831.46, "total_tokens": 5217960} {"current_steps": 8025, "total_steps": 33920, "loss": 0.4757, "lr": 9.44263296646431e-06, "epoch": 4.7317216981132075, "percentage": 23.66, "elapsed_time": "0:14:55", "remaining_time": "0:48:09", "throughput": 5831.99, "total_tokens": 5221576} {"current_steps": 8030, "total_steps": 33920, "loss": 0.5286, "lr": 9.441451952546835e-06, "epoch": 4.734669811320755, "percentage": 23.67, "elapsed_time": "0:14:55", "remaining_time": "0:48:08", "throughput": 5832.24, "total_tokens": 5225160} {"current_steps": 8035, "total_steps": 33920, "loss": 0.456, "lr": 9.440269762735814e-06, "epoch": 4.737617924528302, "percentage": 23.69, "elapsed_time": "0:14:56", "remaining_time": "0:48:07", "throughput": 5832.35, "total_tokens": 5228072} {"current_steps": 8040, "total_steps": 33920, "loss": 0.4229, "lr": 9.439086397344236e-06, "epoch": 4.740566037735849, "percentage": 23.7, "elapsed_time": "0:14:56", "remaining_time": "0:48:06", "throughput": 5832.59, "total_tokens": 5231112} {"current_steps": 8045, "total_steps": 33920, "loss": 0.3379, "lr": 9.437901856685404e-06, "epoch": 4.743514150943396, "percentage": 23.72, "elapsed_time": "0:14:57", "remaining_time": "0:48:06", "throughput": 5832.89, "total_tokens": 5234440} {"current_steps": 8050, "total_steps": 33920, "loss": 0.3924, "lr": 9.436716141072925e-06, "epoch": 4.746462264150943, "percentage": 23.73, "elapsed_time": "0:14:57", "remaining_time": "0:48:05", "throughput": 5833.28, "total_tokens": 5237960} {"current_steps": 8055, "total_steps": 33920, "loss": 0.3906, "lr": 9.435529250820732e-06, "epoch": 4.74941037735849, "percentage": 23.75, "elapsed_time": "0:14:58", "remaining_time": "0:48:04", "throughput": 5832.9, "total_tokens": 5240616} {"current_steps": 8060, "total_steps": 33920, "loss": 0.3462, "lr": 9.43434118624305e-06, "epoch": 4.752358490566038, "percentage": 23.76, "elapsed_time": "0:14:58", "remaining_time": "0:48:04", "throughput": 5832.98, "total_tokens": 5243784} {"current_steps": 8065, "total_steps": 33920, "loss": 0.4659, "lr": 9.433151947654428e-06, "epoch": 4.755306603773585, "percentage": 23.78, "elapsed_time": "0:14:59", "remaining_time": "0:48:03", "throughput": 5833.25, "total_tokens": 5247016} {"current_steps": 8070, "total_steps": 33920, "loss": 0.6033, "lr": 9.431961535369724e-06, "epoch": 4.758254716981132, "percentage": 23.79, "elapsed_time": "0:15:00", "remaining_time": "0:48:03", "throughput": 5833.54, "total_tokens": 5250504} {"current_steps": 8075, "total_steps": 33920, "loss": 0.5665, "lr": 9.430769949704103e-06, "epoch": 4.7612028301886795, "percentage": 23.81, "elapsed_time": "0:15:00", "remaining_time": "0:48:02", "throughput": 5834.01, "total_tokens": 5254056} {"current_steps": 8080, "total_steps": 33920, "loss": 0.328, "lr": 9.42957719097304e-06, "epoch": 4.764150943396227, "percentage": 23.82, "elapsed_time": "0:15:01", "remaining_time": "0:48:02", "throughput": 5834.37, "total_tokens": 5257896} {"current_steps": 8085, "total_steps": 33920, "loss": 0.4381, "lr": 9.42838325949233e-06, "epoch": 4.767099056603773, "percentage": 23.84, "elapsed_time": "0:15:01", "remaining_time": "0:48:01", "throughput": 5834.79, "total_tokens": 5261544} {"current_steps": 8090, "total_steps": 33920, "loss": 0.5191, "lr": 9.427188155578062e-06, "epoch": 4.7700471698113205, "percentage": 23.85, "elapsed_time": "0:15:02", "remaining_time": "0:48:00", "throughput": 5835.39, "total_tokens": 5265352} {"current_steps": 8095, "total_steps": 33920, "loss": 0.5181, "lr": 9.42599187954665e-06, "epoch": 4.772995283018868, "percentage": 23.86, "elapsed_time": "0:15:02", "remaining_time": "0:48:00", "throughput": 5835.72, "total_tokens": 5268648} {"current_steps": 8100, "total_steps": 33920, "loss": 0.5463, "lr": 9.424794431714814e-06, "epoch": 4.775943396226415, "percentage": 23.88, "elapsed_time": "0:15:03", "remaining_time": "0:47:59", "throughput": 5836.19, "total_tokens": 5272200} {"current_steps": 8105, "total_steps": 33920, "loss": 0.5231, "lr": 9.423595812399581e-06, "epoch": 4.778891509433962, "percentage": 23.89, "elapsed_time": "0:15:03", "remaining_time": "0:47:58", "throughput": 5836.21, "total_tokens": 5275048} {"current_steps": 8110, "total_steps": 33920, "loss": 0.5194, "lr": 9.422396021918296e-06, "epoch": 4.78183962264151, "percentage": 23.91, "elapsed_time": "0:15:04", "remaining_time": "0:47:58", "throughput": 5836.72, "total_tokens": 5278600} {"current_steps": 8115, "total_steps": 33920, "loss": 0.5531, "lr": 9.421195060588602e-06, "epoch": 4.784787735849057, "percentage": 23.92, "elapsed_time": "0:15:04", "remaining_time": "0:47:57", "throughput": 5837.08, "total_tokens": 5282056} {"current_steps": 8120, "total_steps": 33920, "loss": 0.3538, "lr": 9.419992928728461e-06, "epoch": 4.787735849056604, "percentage": 23.94, "elapsed_time": "0:15:05", "remaining_time": "0:47:56", "throughput": 5837.19, "total_tokens": 5284808} {"current_steps": 8125, "total_steps": 33920, "loss": 0.4442, "lr": 9.418789626656144e-06, "epoch": 4.790683962264151, "percentage": 23.95, "elapsed_time": "0:15:05", "remaining_time": "0:47:55", "throughput": 5837.48, "total_tokens": 5287880} {"current_steps": 8130, "total_steps": 33920, "loss": 0.3562, "lr": 9.417585154690229e-06, "epoch": 4.793632075471698, "percentage": 23.97, "elapsed_time": "0:15:06", "remaining_time": "0:47:55", "throughput": 5837.58, "total_tokens": 5290728} {"current_steps": 8135, "total_steps": 33920, "loss": 0.3286, "lr": 9.416379513149605e-06, "epoch": 4.796580188679245, "percentage": 23.98, "elapsed_time": "0:15:06", "remaining_time": "0:47:54", "throughput": 5837.52, "total_tokens": 5293640} {"current_steps": 8140, "total_steps": 33920, "loss": 0.4564, "lr": 9.415172702353471e-06, "epoch": 4.7995283018867925, "percentage": 24.0, "elapsed_time": "0:15:07", "remaining_time": "0:47:53", "throughput": 5838.01, "total_tokens": 5297768} {"current_steps": 8145, "total_steps": 33920, "loss": 0.4186, "lr": 9.413964722621339e-06, "epoch": 4.80247641509434, "percentage": 24.01, "elapsed_time": "0:15:07", "remaining_time": "0:47:53", "throughput": 5838.09, "total_tokens": 5300680} {"current_steps": 8150, "total_steps": 33920, "loss": 0.5172, "lr": 9.41275557427302e-06, "epoch": 4.805424528301887, "percentage": 24.03, "elapsed_time": "0:15:08", "remaining_time": "0:47:52", "throughput": 5838.38, "total_tokens": 5303880} {"current_steps": 8155, "total_steps": 33920, "loss": 0.4725, "lr": 9.411545257628646e-06, "epoch": 4.808372641509434, "percentage": 24.04, "elapsed_time": "0:15:08", "remaining_time": "0:47:51", "throughput": 5838.47, "total_tokens": 5307048} {"current_steps": 8160, "total_steps": 33920, "loss": 0.3675, "lr": 9.410333773008653e-06, "epoch": 4.811320754716981, "percentage": 24.06, "elapsed_time": "0:15:09", "remaining_time": "0:47:51", "throughput": 5838.74, "total_tokens": 5310088} {"current_steps": 8165, "total_steps": 33920, "loss": 0.4108, "lr": 9.409121120733784e-06, "epoch": 4.814268867924528, "percentage": 24.07, "elapsed_time": "0:15:09", "remaining_time": "0:47:50", "throughput": 5839.09, "total_tokens": 5313320} {"current_steps": 8170, "total_steps": 33920, "loss": 0.4226, "lr": 9.4079073011251e-06, "epoch": 4.817216981132075, "percentage": 24.09, "elapsed_time": "0:15:10", "remaining_time": "0:47:49", "throughput": 5839.68, "total_tokens": 5317480} {"current_steps": 8175, "total_steps": 33920, "loss": 0.5109, "lr": 9.406692314503956e-06, "epoch": 4.820165094339623, "percentage": 24.1, "elapsed_time": "0:15:11", "remaining_time": "0:47:49", "throughput": 5839.61, "total_tokens": 5320168} {"current_steps": 8180, "total_steps": 33920, "loss": 0.3242, "lr": 9.405476161192033e-06, "epoch": 4.82311320754717, "percentage": 24.12, "elapsed_time": "0:15:11", "remaining_time": "0:47:49", "throughput": 5840.57, "total_tokens": 5326472} {"current_steps": 8185, "total_steps": 33920, "loss": 0.4166, "lr": 9.40425884151131e-06, "epoch": 4.826061320754717, "percentage": 24.13, "elapsed_time": "0:15:12", "remaining_time": "0:47:49", "throughput": 5841.23, "total_tokens": 5330728} {"current_steps": 8190, "total_steps": 33920, "loss": 0.5636, "lr": 9.403040355784076e-06, "epoch": 4.8290094339622645, "percentage": 24.15, "elapsed_time": "0:15:13", "remaining_time": "0:47:48", "throughput": 5841.3, "total_tokens": 5333448} {"current_steps": 8195, "total_steps": 33920, "loss": 0.4205, "lr": 9.401820704332932e-06, "epoch": 4.831957547169811, "percentage": 24.16, "elapsed_time": "0:15:13", "remaining_time": "0:47:47", "throughput": 5841.45, "total_tokens": 5336360} {"current_steps": 8200, "total_steps": 33920, "loss": 0.4176, "lr": 9.400599887480786e-06, "epoch": 4.834905660377358, "percentage": 24.17, "elapsed_time": "0:15:14", "remaining_time": "0:47:46", "throughput": 5841.71, "total_tokens": 5339560} {"current_steps": 8205, "total_steps": 33920, "loss": 0.6162, "lr": 9.399377905550854e-06, "epoch": 4.837853773584905, "percentage": 24.19, "elapsed_time": "0:15:14", "remaining_time": "0:47:46", "throughput": 5841.64, "total_tokens": 5342344} {"current_steps": 8210, "total_steps": 33920, "loss": 0.3588, "lr": 9.398154758866662e-06, "epoch": 4.840801886792453, "percentage": 24.2, "elapsed_time": "0:15:15", "remaining_time": "0:47:45", "throughput": 5842.17, "total_tokens": 5346120} {"current_steps": 8215, "total_steps": 33920, "loss": 0.4534, "lr": 9.396930447752041e-06, "epoch": 4.84375, "percentage": 24.22, "elapsed_time": "0:15:16", "remaining_time": "0:47:46", "throughput": 5842.56, "total_tokens": 5352616} {"current_steps": 8220, "total_steps": 33920, "loss": 0.689, "lr": 9.395704972531137e-06, "epoch": 4.846698113207547, "percentage": 24.23, "elapsed_time": "0:15:16", "remaining_time": "0:47:45", "throughput": 5842.54, "total_tokens": 5355464} {"current_steps": 8225, "total_steps": 33920, "loss": 0.4442, "lr": 9.394478333528396e-06, "epoch": 4.849646226415095, "percentage": 24.25, "elapsed_time": "0:15:17", "remaining_time": "0:47:45", "throughput": 5842.52, "total_tokens": 5358504} {"current_steps": 8230, "total_steps": 33920, "loss": 0.364, "lr": 9.393250531068576e-06, "epoch": 4.852594339622642, "percentage": 24.26, "elapsed_time": "0:15:17", "remaining_time": "0:47:44", "throughput": 5842.1, "total_tokens": 5360648} {"current_steps": 8235, "total_steps": 33920, "loss": 0.3551, "lr": 9.392021565476744e-06, "epoch": 4.855542452830189, "percentage": 24.28, "elapsed_time": "0:15:18", "remaining_time": "0:47:44", "throughput": 5842.95, "total_tokens": 5366024} {"current_steps": 8240, "total_steps": 33920, "loss": 0.3379, "lr": 9.390791437078274e-06, "epoch": 4.8584905660377355, "percentage": 24.29, "elapsed_time": "0:15:18", "remaining_time": "0:47:43", "throughput": 5843.36, "total_tokens": 5369352} {"current_steps": 8245, "total_steps": 33920, "loss": 0.4944, "lr": 9.38956014619885e-06, "epoch": 4.861438679245283, "percentage": 24.31, "elapsed_time": "0:15:19", "remaining_time": "0:47:42", "throughput": 5843.3, "total_tokens": 5372104} {"current_steps": 8250, "total_steps": 33920, "loss": 0.6616, "lr": 9.388327693164456e-06, "epoch": 4.86438679245283, "percentage": 24.32, "elapsed_time": "0:15:19", "remaining_time": "0:47:41", "throughput": 5843.35, "total_tokens": 5374728} {"current_steps": 8255, "total_steps": 33920, "loss": 0.4208, "lr": 9.387094078301395e-06, "epoch": 4.867334905660377, "percentage": 24.34, "elapsed_time": "0:15:20", "remaining_time": "0:47:42", "throughput": 5844.04, "total_tokens": 5380328} {"current_steps": 8260, "total_steps": 33920, "loss": 0.3802, "lr": 9.385859301936269e-06, "epoch": 4.870283018867925, "percentage": 24.35, "elapsed_time": "0:15:21", "remaining_time": "0:47:41", "throughput": 5844.64, "total_tokens": 5384488} {"current_steps": 8265, "total_steps": 33920, "loss": 0.3822, "lr": 9.38462336439599e-06, "epoch": 4.873231132075472, "percentage": 24.37, "elapsed_time": "0:15:21", "remaining_time": "0:47:41", "throughput": 5844.33, "total_tokens": 5386888} {"current_steps": 8270, "total_steps": 33920, "loss": 0.5905, "lr": 9.383386266007779e-06, "epoch": 4.876179245283019, "percentage": 24.38, "elapsed_time": "0:15:22", "remaining_time": "0:47:40", "throughput": 5844.33, "total_tokens": 5389576} {"current_steps": 8275, "total_steps": 33920, "loss": 0.4105, "lr": 9.382148007099164e-06, "epoch": 4.879127358490566, "percentage": 24.4, "elapsed_time": "0:15:22", "remaining_time": "0:47:39", "throughput": 5844.53, "total_tokens": 5392744} {"current_steps": 8280, "total_steps": 33920, "loss": 0.3934, "lr": 9.380908587997977e-06, "epoch": 4.882075471698113, "percentage": 24.41, "elapsed_time": "0:15:23", "remaining_time": "0:47:38", "throughput": 5844.96, "total_tokens": 5396328} {"current_steps": 8285, "total_steps": 33920, "loss": 0.3989, "lr": 9.37966800903236e-06, "epoch": 4.88502358490566, "percentage": 24.43, "elapsed_time": "0:15:23", "remaining_time": "0:47:38", "throughput": 5845.26, "total_tokens": 5399496} {"current_steps": 8290, "total_steps": 33920, "loss": 0.4764, "lr": 9.378426270530762e-06, "epoch": 4.8879716981132075, "percentage": 24.44, "elapsed_time": "0:15:24", "remaining_time": "0:47:37", "throughput": 5845.19, "total_tokens": 5402312} {"current_steps": 8295, "total_steps": 33920, "loss": 0.4632, "lr": 9.37718337282194e-06, "epoch": 4.890919811320755, "percentage": 24.45, "elapsed_time": "0:15:24", "remaining_time": "0:47:36", "throughput": 5845.68, "total_tokens": 5405928} {"current_steps": 8300, "total_steps": 33920, "loss": 0.4719, "lr": 9.375939316234956e-06, "epoch": 4.893867924528302, "percentage": 24.47, "elapsed_time": "0:15:25", "remaining_time": "0:47:36", "throughput": 5846.14, "total_tokens": 5409608} {"current_steps": 8305, "total_steps": 33920, "loss": 0.4291, "lr": 9.374694101099178e-06, "epoch": 4.896816037735849, "percentage": 24.48, "elapsed_time": "0:15:25", "remaining_time": "0:47:35", "throughput": 5846.42, "total_tokens": 5412744} {"current_steps": 8310, "total_steps": 33920, "loss": 0.4423, "lr": 9.373447727744282e-06, "epoch": 4.899764150943396, "percentage": 24.5, "elapsed_time": "0:15:26", "remaining_time": "0:47:35", "throughput": 5847.24, "total_tokens": 5417512} {"current_steps": 8315, "total_steps": 33920, "loss": 0.4771, "lr": 9.372200196500253e-06, "epoch": 4.902712264150943, "percentage": 24.51, "elapsed_time": "0:15:27", "remaining_time": "0:47:34", "throughput": 5847.18, "total_tokens": 5420648} {"current_steps": 8320, "total_steps": 33920, "loss": 0.3742, "lr": 9.37095150769738e-06, "epoch": 4.90566037735849, "percentage": 24.53, "elapsed_time": "0:15:27", "remaining_time": "0:47:33", "throughput": 5846.87, "total_tokens": 5423016} {"current_steps": 8325, "total_steps": 33920, "loss": 0.4001, "lr": 9.369701661666255e-06, "epoch": 4.908608490566038, "percentage": 24.54, "elapsed_time": "0:15:27", "remaining_time": "0:47:32", "throughput": 5846.74, "total_tokens": 5425544} {"current_steps": 8330, "total_steps": 33920, "loss": 0.4381, "lr": 9.368450658737782e-06, "epoch": 4.911556603773585, "percentage": 24.56, "elapsed_time": "0:15:28", "remaining_time": "0:47:32", "throughput": 5847.05, "total_tokens": 5429032} {"current_steps": 8335, "total_steps": 33920, "loss": 0.5225, "lr": 9.367198499243173e-06, "epoch": 4.914504716981132, "percentage": 24.57, "elapsed_time": "0:15:28", "remaining_time": "0:47:31", "throughput": 5847.21, "total_tokens": 5432040} {"current_steps": 8340, "total_steps": 33920, "loss": 0.4484, "lr": 9.365945183513938e-06, "epoch": 4.9174528301886795, "percentage": 24.59, "elapsed_time": "0:15:29", "remaining_time": "0:47:30", "throughput": 5847.39, "total_tokens": 5435240} {"current_steps": 8345, "total_steps": 33920, "loss": 0.474, "lr": 9.3646907118819e-06, "epoch": 4.920400943396227, "percentage": 24.6, "elapsed_time": "0:15:30", "remaining_time": "0:47:30", "throughput": 5847.8, "total_tokens": 5438952} {"current_steps": 8350, "total_steps": 33920, "loss": 0.4824, "lr": 9.363435084679185e-06, "epoch": 4.923349056603773, "percentage": 24.62, "elapsed_time": "0:15:30", "remaining_time": "0:47:29", "throughput": 5847.83, "total_tokens": 5441672} {"current_steps": 8355, "total_steps": 33920, "loss": 0.4053, "lr": 9.362178302238227e-06, "epoch": 4.9262971698113205, "percentage": 24.63, "elapsed_time": "0:15:31", "remaining_time": "0:47:28", "throughput": 5847.72, "total_tokens": 5444488} {"current_steps": 8360, "total_steps": 33920, "loss": 0.4813, "lr": 9.360920364891762e-06, "epoch": 4.929245283018868, "percentage": 24.65, "elapsed_time": "0:15:31", "remaining_time": "0:47:28", "throughput": 5847.82, "total_tokens": 5447400} {"current_steps": 8365, "total_steps": 33920, "loss": 0.398, "lr": 9.359661272972836e-06, "epoch": 4.932193396226415, "percentage": 24.66, "elapsed_time": "0:15:32", "remaining_time": "0:47:27", "throughput": 5848.22, "total_tokens": 5451112} {"current_steps": 8370, "total_steps": 33920, "loss": 0.4676, "lr": 9.3584010268148e-06, "epoch": 4.935141509433962, "percentage": 24.68, "elapsed_time": "0:15:32", "remaining_time": "0:47:26", "throughput": 5848.57, "total_tokens": 5454376} {"current_steps": 8375, "total_steps": 33920, "loss": 0.4263, "lr": 9.357139626751308e-06, "epoch": 4.93808962264151, "percentage": 24.69, "elapsed_time": "0:15:33", "remaining_time": "0:47:26", "throughput": 5848.96, "total_tokens": 5457896} {"current_steps": 8380, "total_steps": 33920, "loss": 0.4814, "lr": 9.355877073116321e-06, "epoch": 4.941037735849057, "percentage": 24.71, "elapsed_time": "0:15:33", "remaining_time": "0:47:25", "throughput": 5848.86, "total_tokens": 5460584} {"current_steps": 8385, "total_steps": 33920, "loss": 0.4842, "lr": 9.354613366244108e-06, "epoch": 4.943985849056604, "percentage": 24.72, "elapsed_time": "0:15:34", "remaining_time": "0:47:24", "throughput": 5848.89, "total_tokens": 5463368} {"current_steps": 8390, "total_steps": 33920, "loss": 0.6057, "lr": 9.353348506469236e-06, "epoch": 4.946933962264151, "percentage": 24.73, "elapsed_time": "0:15:34", "remaining_time": "0:47:24", "throughput": 5849.55, "total_tokens": 5467720} {"current_steps": 8395, "total_steps": 33920, "loss": 0.4386, "lr": 9.352082494126586e-06, "epoch": 4.949882075471698, "percentage": 24.75, "elapsed_time": "0:15:35", "remaining_time": "0:47:23", "throughput": 5849.73, "total_tokens": 5470792} {"current_steps": 8400, "total_steps": 33920, "loss": 0.4343, "lr": 9.350815329551341e-06, "epoch": 4.952830188679245, "percentage": 24.76, "elapsed_time": "0:15:35", "remaining_time": "0:47:23", "throughput": 5850.06, "total_tokens": 5474504} {"current_steps": 8405, "total_steps": 33920, "loss": 0.4271, "lr": 9.349547013078986e-06, "epoch": 4.9557783018867925, "percentage": 24.78, "elapsed_time": "0:15:36", "remaining_time": "0:47:22", "throughput": 5850.57, "total_tokens": 5478536} {"current_steps": 8410, "total_steps": 33920, "loss": 0.5504, "lr": 9.348277545045312e-06, "epoch": 4.95872641509434, "percentage": 24.79, "elapsed_time": "0:15:36", "remaining_time": "0:47:21", "throughput": 5850.36, "total_tokens": 5480936} {"current_steps": 8415, "total_steps": 33920, "loss": 0.5185, "lr": 9.347006925786418e-06, "epoch": 4.961674528301887, "percentage": 24.81, "elapsed_time": "0:15:37", "remaining_time": "0:47:21", "throughput": 5850.67, "total_tokens": 5484200} {"current_steps": 8420, "total_steps": 33920, "loss": 0.4222, "lr": 9.34573515563871e-06, "epoch": 4.964622641509434, "percentage": 24.82, "elapsed_time": "0:15:37", "remaining_time": "0:47:20", "throughput": 5850.94, "total_tokens": 5487496} {"current_steps": 8425, "total_steps": 33920, "loss": 0.3243, "lr": 9.344462234938885e-06, "epoch": 4.967570754716981, "percentage": 24.84, "elapsed_time": "0:15:38", "remaining_time": "0:47:19", "throughput": 5850.56, "total_tokens": 5489864} {"current_steps": 8430, "total_steps": 33920, "loss": 0.5222, "lr": 9.343188164023962e-06, "epoch": 4.970518867924528, "percentage": 24.85, "elapsed_time": "0:15:38", "remaining_time": "0:47:19", "throughput": 5851.06, "total_tokens": 5493704} {"current_steps": 8435, "total_steps": 33920, "loss": 0.4547, "lr": 9.341912943231256e-06, "epoch": 4.973466981132075, "percentage": 24.87, "elapsed_time": "0:15:39", "remaining_time": "0:47:19", "throughput": 5851.87, "total_tokens": 5499560} {"current_steps": 8440, "total_steps": 33920, "loss": 0.648, "lr": 9.340636572898383e-06, "epoch": 4.976415094339623, "percentage": 24.88, "elapsed_time": "0:15:40", "remaining_time": "0:47:18", "throughput": 5851.65, "total_tokens": 5501992} {"current_steps": 8445, "total_steps": 33920, "loss": 0.3866, "lr": 9.339359053363272e-06, "epoch": 4.97936320754717, "percentage": 24.9, "elapsed_time": "0:15:40", "remaining_time": "0:47:17", "throughput": 5851.92, "total_tokens": 5505352} {"current_steps": 8450, "total_steps": 33920, "loss": 0.5358, "lr": 9.338080384964148e-06, "epoch": 4.982311320754717, "percentage": 24.91, "elapsed_time": "0:15:41", "remaining_time": "0:47:17", "throughput": 5852.08, "total_tokens": 5508232} {"current_steps": 8455, "total_steps": 33920, "loss": 0.4299, "lr": 9.336800568039548e-06, "epoch": 4.9852594339622645, "percentage": 24.93, "elapsed_time": "0:15:41", "remaining_time": "0:47:16", "throughput": 5852.93, "total_tokens": 5512872} {"current_steps": 8460, "total_steps": 33920, "loss": 0.5236, "lr": 9.335519602928307e-06, "epoch": 4.988207547169811, "percentage": 24.94, "elapsed_time": "0:15:42", "remaining_time": "0:47:16", "throughput": 5853.36, "total_tokens": 5516584} {"current_steps": 8465, "total_steps": 33920, "loss": 0.4382, "lr": 9.334237489969565e-06, "epoch": 4.991155660377358, "percentage": 24.96, "elapsed_time": "0:15:43", "remaining_time": "0:47:15", "throughput": 5853.88, "total_tokens": 5520392} {"current_steps": 8470, "total_steps": 33920, "loss": 0.4476, "lr": 9.332954229502768e-06, "epoch": 4.994103773584905, "percentage": 24.97, "elapsed_time": "0:15:43", "remaining_time": "0:47:15", "throughput": 5854.19, "total_tokens": 5523528} {"current_steps": 8475, "total_steps": 33920, "loss": 0.3976, "lr": 9.331669821867665e-06, "epoch": 4.997051886792453, "percentage": 24.99, "elapsed_time": "0:15:43", "remaining_time": "0:47:14", "throughput": 5854.05, "total_tokens": 5526216} {"current_steps": 8480, "total_steps": 33920, "loss": 0.4917, "lr": 9.33038426740431e-06, "epoch": 5.0, "percentage": 25.0, "elapsed_time": "0:15:44", "remaining_time": "0:47:13", "throughput": 5853.02, "total_tokens": 5528680} {"current_steps": 8485, "total_steps": 33920, "loss": 0.4527, "lr": 9.329097566453055e-06, "epoch": 5.002948113207547, "percentage": 25.01, "elapsed_time": "0:15:45", "remaining_time": "0:47:13", "throughput": 5852.02, "total_tokens": 5531464} {"current_steps": 8490, "total_steps": 33920, "loss": 0.5777, "lr": 9.327809719354564e-06, "epoch": 5.005896226415095, "percentage": 25.03, "elapsed_time": "0:15:45", "remaining_time": "0:47:12", "throughput": 5851.79, "total_tokens": 5534216} {"current_steps": 8495, "total_steps": 33920, "loss": 0.6475, "lr": 9.326520726449795e-06, "epoch": 5.008844339622642, "percentage": 25.04, "elapsed_time": "0:15:46", "remaining_time": "0:47:12", "throughput": 5851.83, "total_tokens": 5537224} {"current_steps": 8500, "total_steps": 33920, "loss": 0.4129, "lr": 9.32523058808002e-06, "epoch": 5.011792452830188, "percentage": 25.06, "elapsed_time": "0:15:46", "remaining_time": "0:47:11", "throughput": 5852.13, "total_tokens": 5540904} {"current_steps": 8505, "total_steps": 33920, "loss": 0.5609, "lr": 9.323939304586806e-06, "epoch": 5.0147405660377355, "percentage": 25.07, "elapsed_time": "0:15:47", "remaining_time": "0:47:10", "throughput": 5852.4, "total_tokens": 5544328} {"current_steps": 8510, "total_steps": 33920, "loss": 0.3596, "lr": 9.322646876312025e-06, "epoch": 5.017688679245283, "percentage": 25.09, "elapsed_time": "0:15:48", "remaining_time": "0:47:11", "throughput": 5853.41, "total_tokens": 5550984} {"current_steps": 8515, "total_steps": 33920, "loss": 0.375, "lr": 9.321353303597854e-06, "epoch": 5.02063679245283, "percentage": 25.1, "elapsed_time": "0:15:48", "remaining_time": "0:47:11", "throughput": 5854.01, "total_tokens": 5555240} {"current_steps": 8520, "total_steps": 33920, "loss": 0.4131, "lr": 9.320058586786771e-06, "epoch": 5.023584905660377, "percentage": 25.12, "elapsed_time": "0:15:49", "remaining_time": "0:47:10", "throughput": 5854.43, "total_tokens": 5559208} {"current_steps": 8525, "total_steps": 33920, "loss": 0.3864, "lr": 9.31876272622156e-06, "epoch": 5.026533018867925, "percentage": 25.13, "elapsed_time": "0:15:50", "remaining_time": "0:47:10", "throughput": 5854.94, "total_tokens": 5562824} {"current_steps": 8530, "total_steps": 33920, "loss": 0.4407, "lr": 9.317465722245305e-06, "epoch": 5.029481132075472, "percentage": 25.15, "elapsed_time": "0:15:50", "remaining_time": "0:47:09", "throughput": 5855.22, "total_tokens": 5566216} {"current_steps": 8535, "total_steps": 33920, "loss": 0.3771, "lr": 9.316167575201391e-06, "epoch": 5.032429245283019, "percentage": 25.16, "elapsed_time": "0:15:51", "remaining_time": "0:47:09", "throughput": 5855.86, "total_tokens": 5570696} {"current_steps": 8540, "total_steps": 33920, "loss": 0.5153, "lr": 9.31486828543351e-06, "epoch": 5.035377358490566, "percentage": 25.18, "elapsed_time": "0:15:51", "remaining_time": "0:47:08", "throughput": 5856.22, "total_tokens": 5574248} {"current_steps": 8545, "total_steps": 33920, "loss": 0.3103, "lr": 9.313567853285656e-06, "epoch": 5.038325471698113, "percentage": 25.19, "elapsed_time": "0:15:52", "remaining_time": "0:47:08", "throughput": 5856.27, "total_tokens": 5577256} {"current_steps": 8550, "total_steps": 33920, "loss": 0.4426, "lr": 9.31226627910212e-06, "epoch": 5.04127358490566, "percentage": 25.21, "elapsed_time": "0:15:52", "remaining_time": "0:47:07", "throughput": 5856.77, "total_tokens": 5580872} {"current_steps": 8555, "total_steps": 33920, "loss": 0.4514, "lr": 9.310963563227504e-06, "epoch": 5.0442216981132075, "percentage": 25.22, "elapsed_time": "0:15:53", "remaining_time": "0:47:07", "throughput": 5857.5, "total_tokens": 5585256} {"current_steps": 8560, "total_steps": 33920, "loss": 0.4937, "lr": 9.309659706006704e-06, "epoch": 5.047169811320755, "percentage": 25.24, "elapsed_time": "0:15:53", "remaining_time": "0:47:06", "throughput": 5857.26, "total_tokens": 5587592} {"current_steps": 8565, "total_steps": 33920, "loss": 0.3876, "lr": 9.308354707784925e-06, "epoch": 5.050117924528302, "percentage": 25.25, "elapsed_time": "0:15:54", "remaining_time": "0:47:05", "throughput": 5857.81, "total_tokens": 5591464} {"current_steps": 8570, "total_steps": 33920, "loss": 0.4688, "lr": 9.307048568907669e-06, "epoch": 5.053066037735849, "percentage": 25.27, "elapsed_time": "0:15:55", "remaining_time": "0:47:04", "throughput": 5857.76, "total_tokens": 5594344} {"current_steps": 8575, "total_steps": 33920, "loss": 0.42, "lr": 9.30574128972074e-06, "epoch": 5.056014150943396, "percentage": 25.28, "elapsed_time": "0:15:55", "remaining_time": "0:47:04", "throughput": 5857.8, "total_tokens": 5597192} {"current_steps": 8580, "total_steps": 33920, "loss": 0.4025, "lr": 9.304432870570247e-06, "epoch": 5.058962264150943, "percentage": 25.29, "elapsed_time": "0:15:55", "remaining_time": "0:47:03", "throughput": 5857.53, "total_tokens": 5599784} {"current_steps": 8585, "total_steps": 33920, "loss": 0.4048, "lr": 9.303123311802605e-06, "epoch": 5.06191037735849, "percentage": 25.31, "elapsed_time": "0:15:56", "remaining_time": "0:47:02", "throughput": 5857.7, "total_tokens": 5602792} {"current_steps": 8590, "total_steps": 33920, "loss": 0.4445, "lr": 9.301812613764516e-06, "epoch": 5.064858490566038, "percentage": 25.32, "elapsed_time": "0:15:57", "remaining_time": "0:47:02", "throughput": 5857.69, "total_tokens": 5605896} {"current_steps": 8595, "total_steps": 33920, "loss": 0.4476, "lr": 9.300500776803001e-06, "epoch": 5.067806603773585, "percentage": 25.34, "elapsed_time": "0:15:57", "remaining_time": "0:47:01", "throughput": 5857.7, "total_tokens": 5608712} {"current_steps": 8600, "total_steps": 33920, "loss": 0.4131, "lr": 9.29918780126537e-06, "epoch": 5.070754716981132, "percentage": 25.35, "elapsed_time": "0:15:57", "remaining_time": "0:47:00", "throughput": 5857.66, "total_tokens": 5611432} {"current_steps": 8605, "total_steps": 33920, "loss": 0.4427, "lr": 9.297873687499239e-06, "epoch": 5.0737028301886795, "percentage": 25.37, "elapsed_time": "0:15:58", "remaining_time": "0:46:59", "throughput": 5857.79, "total_tokens": 5614440} {"current_steps": 8610, "total_steps": 33920, "loss": 0.3489, "lr": 9.296558435852528e-06, "epoch": 5.076650943396227, "percentage": 25.38, "elapsed_time": "0:15:58", "remaining_time": "0:46:58", "throughput": 5857.73, "total_tokens": 5617032} {"current_steps": 8615, "total_steps": 33920, "loss": 0.4595, "lr": 9.295242046673454e-06, "epoch": 5.079599056603773, "percentage": 25.4, "elapsed_time": "0:15:59", "remaining_time": "0:46:58", "throughput": 5857.87, "total_tokens": 5620072} {"current_steps": 8620, "total_steps": 33920, "loss": 0.501, "lr": 9.293924520310535e-06, "epoch": 5.0825471698113205, "percentage": 25.41, "elapsed_time": "0:15:59", "remaining_time": "0:46:57", "throughput": 5858.04, "total_tokens": 5623304} {"current_steps": 8625, "total_steps": 33920, "loss": 0.4741, "lr": 9.292605857112595e-06, "epoch": 5.085495283018868, "percentage": 25.43, "elapsed_time": "0:16:00", "remaining_time": "0:46:56", "throughput": 5858.41, "total_tokens": 5627080} {"current_steps": 8630, "total_steps": 33920, "loss": 0.4497, "lr": 9.291286057428755e-06, "epoch": 5.088443396226415, "percentage": 25.44, "elapsed_time": "0:16:01", "remaining_time": "0:46:56", "throughput": 5858.81, "total_tokens": 5630568} {"current_steps": 8635, "total_steps": 33920, "loss": 0.2771, "lr": 9.289965121608436e-06, "epoch": 5.091391509433962, "percentage": 25.46, "elapsed_time": "0:16:01", "remaining_time": "0:46:55", "throughput": 5859.12, "total_tokens": 5633864} {"current_steps": 8640, "total_steps": 33920, "loss": 0.4199, "lr": 9.288643050001362e-06, "epoch": 5.09433962264151, "percentage": 25.47, "elapsed_time": "0:16:02", "remaining_time": "0:46:54", "throughput": 5858.98, "total_tokens": 5636552} {"current_steps": 8645, "total_steps": 33920, "loss": 0.5116, "lr": 9.287319842957557e-06, "epoch": 5.097287735849057, "percentage": 25.49, "elapsed_time": "0:16:02", "remaining_time": "0:46:54", "throughput": 5858.99, "total_tokens": 5639304} {"current_steps": 8650, "total_steps": 33920, "loss": 0.4196, "lr": 9.285995500827348e-06, "epoch": 5.100235849056604, "percentage": 25.5, "elapsed_time": "0:16:02", "remaining_time": "0:46:53", "throughput": 5858.9, "total_tokens": 5641960} {"current_steps": 8655, "total_steps": 33920, "loss": 0.5389, "lr": 9.284670023961355e-06, "epoch": 5.103183962264151, "percentage": 25.52, "elapsed_time": "0:16:03", "remaining_time": "0:46:52", "throughput": 5859.45, "total_tokens": 5645928} {"current_steps": 8660, "total_steps": 33920, "loss": 0.5125, "lr": 9.28334341271051e-06, "epoch": 5.106132075471698, "percentage": 25.53, "elapsed_time": "0:16:04", "remaining_time": "0:46:52", "throughput": 5859.75, "total_tokens": 5649160} {"current_steps": 8665, "total_steps": 33920, "loss": 0.4747, "lr": 9.282015667426036e-06, "epoch": 5.109080188679245, "percentage": 25.55, "elapsed_time": "0:16:04", "remaining_time": "0:46:51", "throughput": 5859.67, "total_tokens": 5651816} {"current_steps": 8670, "total_steps": 33920, "loss": 0.5281, "lr": 9.280686788459461e-06, "epoch": 5.1120283018867925, "percentage": 25.56, "elapsed_time": "0:16:05", "remaining_time": "0:46:51", "throughput": 5860.19, "total_tokens": 5656328} {"current_steps": 8675, "total_steps": 33920, "loss": 0.4091, "lr": 9.279356776162606e-06, "epoch": 5.11497641509434, "percentage": 25.57, "elapsed_time": "0:16:05", "remaining_time": "0:46:50", "throughput": 5860.34, "total_tokens": 5660008} {"current_steps": 8680, "total_steps": 33920, "loss": 0.4998, "lr": 9.278025630887607e-06, "epoch": 5.117924528301887, "percentage": 25.59, "elapsed_time": "0:16:06", "remaining_time": "0:46:49", "throughput": 5860.26, "total_tokens": 5662696} {"current_steps": 8685, "total_steps": 33920, "loss": 0.3865, "lr": 9.27669335298688e-06, "epoch": 5.120872641509434, "percentage": 25.6, "elapsed_time": "0:16:06", "remaining_time": "0:46:49", "throughput": 5860.6, "total_tokens": 5666216} {"current_steps": 8690, "total_steps": 33920, "loss": 0.4275, "lr": 9.275359942813158e-06, "epoch": 5.123820754716981, "percentage": 25.62, "elapsed_time": "0:16:07", "remaining_time": "0:46:48", "throughput": 5860.55, "total_tokens": 5669128} {"current_steps": 8695, "total_steps": 33920, "loss": 0.4193, "lr": 9.274025400719466e-06, "epoch": 5.126768867924528, "percentage": 25.63, "elapsed_time": "0:16:07", "remaining_time": "0:46:47", "throughput": 5860.78, "total_tokens": 5672168} {"current_steps": 8700, "total_steps": 33920, "loss": 0.4861, "lr": 9.27268972705913e-06, "epoch": 5.129716981132075, "percentage": 25.65, "elapsed_time": "0:16:08", "remaining_time": "0:46:47", "throughput": 5861.08, "total_tokens": 5675528} {"current_steps": 8705, "total_steps": 33920, "loss": 0.5187, "lr": 9.271352922185772e-06, "epoch": 5.132665094339623, "percentage": 25.66, "elapsed_time": "0:16:08", "remaining_time": "0:46:46", "throughput": 5861.87, "total_tokens": 5680072} {"current_steps": 8710, "total_steps": 33920, "loss": 0.4098, "lr": 9.270014986453321e-06, "epoch": 5.13561320754717, "percentage": 25.68, "elapsed_time": "0:16:09", "remaining_time": "0:46:46", "throughput": 5862.14, "total_tokens": 5683688} {"current_steps": 8715, "total_steps": 33920, "loss": 0.5463, "lr": 9.268675920215999e-06, "epoch": 5.138561320754717, "percentage": 25.69, "elapsed_time": "0:16:10", "remaining_time": "0:46:45", "throughput": 5862.13, "total_tokens": 5686600} {"current_steps": 8720, "total_steps": 33920, "loss": 0.4909, "lr": 9.26733572382833e-06, "epoch": 5.1415094339622645, "percentage": 25.71, "elapsed_time": "0:16:10", "remaining_time": "0:46:45", "throughput": 5862.39, "total_tokens": 5690376} {"current_steps": 8725, "total_steps": 33920, "loss": 0.462, "lr": 9.265994397645137e-06, "epoch": 5.144457547169812, "percentage": 25.72, "elapsed_time": "0:16:11", "remaining_time": "0:46:44", "throughput": 5862.23, "total_tokens": 5692840} {"current_steps": 8730, "total_steps": 33920, "loss": 0.5319, "lr": 9.264651942021543e-06, "epoch": 5.147405660377358, "percentage": 25.74, "elapsed_time": "0:16:11", "remaining_time": "0:46:43", "throughput": 5862.74, "total_tokens": 5697032} {"current_steps": 8735, "total_steps": 33920, "loss": 0.4488, "lr": 9.263308357312966e-06, "epoch": 5.150353773584905, "percentage": 25.75, "elapsed_time": "0:16:12", "remaining_time": "0:46:43", "throughput": 5862.95, "total_tokens": 5700552} {"current_steps": 8740, "total_steps": 33920, "loss": 0.4837, "lr": 9.26196364387513e-06, "epoch": 5.153301886792453, "percentage": 25.77, "elapsed_time": "0:16:13", "remaining_time": "0:46:43", "throughput": 5863.6, "total_tokens": 5705288} {"current_steps": 8745, "total_steps": 33920, "loss": 0.4218, "lr": 9.26061780206405e-06, "epoch": 5.15625, "percentage": 25.78, "elapsed_time": "0:16:13", "remaining_time": "0:46:42", "throughput": 5863.47, "total_tokens": 5708008} {"current_steps": 8750, "total_steps": 33920, "loss": 0.454, "lr": 9.259270832236043e-06, "epoch": 5.159198113207547, "percentage": 25.8, "elapsed_time": "0:16:14", "remaining_time": "0:46:41", "throughput": 5863.67, "total_tokens": 5711240} {"current_steps": 8755, "total_steps": 33920, "loss": 0.481, "lr": 9.257922734747729e-06, "epoch": 5.162146226415095, "percentage": 25.81, "elapsed_time": "0:16:14", "remaining_time": "0:46:41", "throughput": 5863.75, "total_tokens": 5714312} {"current_steps": 8760, "total_steps": 33920, "loss": 0.418, "lr": 9.256573509956018e-06, "epoch": 5.165094339622642, "percentage": 25.83, "elapsed_time": "0:16:15", "remaining_time": "0:46:40", "throughput": 5863.71, "total_tokens": 5717320} {"current_steps": 8765, "total_steps": 33920, "loss": 0.425, "lr": 9.255223158218127e-06, "epoch": 5.168042452830188, "percentage": 25.84, "elapsed_time": "0:16:15", "remaining_time": "0:46:40", "throughput": 5864.4, "total_tokens": 5722088} {"current_steps": 8770, "total_steps": 33920, "loss": 0.3329, "lr": 9.253871679891566e-06, "epoch": 5.1709905660377355, "percentage": 25.85, "elapsed_time": "0:16:16", "remaining_time": "0:46:39", "throughput": 5864.47, "total_tokens": 5725256} {"current_steps": 8775, "total_steps": 33920, "loss": 0.4566, "lr": 9.252519075334143e-06, "epoch": 5.173938679245283, "percentage": 25.87, "elapsed_time": "0:16:16", "remaining_time": "0:46:39", "throughput": 5864.8, "total_tokens": 5728744} {"current_steps": 8780, "total_steps": 33920, "loss": 0.4003, "lr": 9.251165344903969e-06, "epoch": 5.17688679245283, "percentage": 25.88, "elapsed_time": "0:16:17", "remaining_time": "0:46:38", "throughput": 5864.87, "total_tokens": 5732168} {"current_steps": 8785, "total_steps": 33920, "loss": 0.5422, "lr": 9.249810488959448e-06, "epoch": 5.179834905660377, "percentage": 25.9, "elapsed_time": "0:16:17", "remaining_time": "0:46:37", "throughput": 5865.16, "total_tokens": 5735752} {"current_steps": 8790, "total_steps": 33920, "loss": 0.5083, "lr": 9.248454507859285e-06, "epoch": 5.182783018867925, "percentage": 25.91, "elapsed_time": "0:16:18", "remaining_time": "0:46:37", "throughput": 5865.35, "total_tokens": 5738856} {"current_steps": 8795, "total_steps": 33920, "loss": 0.4668, "lr": 9.247097401962482e-06, "epoch": 5.185731132075472, "percentage": 25.93, "elapsed_time": "0:16:19", "remaining_time": "0:46:36", "throughput": 5865.76, "total_tokens": 5742696} {"current_steps": 8800, "total_steps": 33920, "loss": 0.4625, "lr": 9.245739171628335e-06, "epoch": 5.188679245283019, "percentage": 25.94, "elapsed_time": "0:16:19", "remaining_time": "0:46:36", "throughput": 5865.65, "total_tokens": 5745640} {"current_steps": 8805, "total_steps": 33920, "loss": 0.4479, "lr": 9.244379817216447e-06, "epoch": 5.191627358490566, "percentage": 25.96, "elapsed_time": "0:16:20", "remaining_time": "0:46:35", "throughput": 5865.98, "total_tokens": 5749000} {"current_steps": 8810, "total_steps": 33920, "loss": 0.3377, "lr": 9.243019339086708e-06, "epoch": 5.194575471698113, "percentage": 25.97, "elapsed_time": "0:16:20", "remaining_time": "0:46:34", "throughput": 5866.44, "total_tokens": 5752808} {"current_steps": 8815, "total_steps": 33920, "loss": 0.4219, "lr": 9.241657737599313e-06, "epoch": 5.19752358490566, "percentage": 25.99, "elapsed_time": "0:16:21", "remaining_time": "0:46:34", "throughput": 5866.71, "total_tokens": 5756296} {"current_steps": 8820, "total_steps": 33920, "loss": 0.4986, "lr": 9.240295013114752e-06, "epoch": 5.2004716981132075, "percentage": 26.0, "elapsed_time": "0:16:21", "remaining_time": "0:46:33", "throughput": 5866.48, "total_tokens": 5758984} {"current_steps": 8825, "total_steps": 33920, "loss": 0.4544, "lr": 9.238931165993811e-06, "epoch": 5.203419811320755, "percentage": 26.02, "elapsed_time": "0:16:22", "remaining_time": "0:46:33", "throughput": 5866.68, "total_tokens": 5762472} {"current_steps": 8830, "total_steps": 33920, "loss": 0.5471, "lr": 9.237566196597577e-06, "epoch": 5.206367924528302, "percentage": 26.03, "elapsed_time": "0:16:22", "remaining_time": "0:46:33", "throughput": 5867.35, "total_tokens": 5767592} {"current_steps": 8835, "total_steps": 33920, "loss": 0.5388, "lr": 9.236200105287427e-06, "epoch": 5.209316037735849, "percentage": 26.05, "elapsed_time": "0:16:23", "remaining_time": "0:46:32", "throughput": 5867.45, "total_tokens": 5770792} {"current_steps": 8840, "total_steps": 33920, "loss": 0.5583, "lr": 9.234832892425042e-06, "epoch": 5.212264150943396, "percentage": 26.06, "elapsed_time": "0:16:24", "remaining_time": "0:46:31", "throughput": 5867.3, "total_tokens": 5773512} {"current_steps": 8845, "total_steps": 33920, "loss": 0.5692, "lr": 9.2334645583724e-06, "epoch": 5.215212264150943, "percentage": 26.08, "elapsed_time": "0:16:24", "remaining_time": "0:46:31", "throughput": 5867.16, "total_tokens": 5776456} {"current_steps": 8850, "total_steps": 33920, "loss": 0.4607, "lr": 9.23209510349177e-06, "epoch": 5.21816037735849, "percentage": 26.09, "elapsed_time": "0:16:25", "remaining_time": "0:46:30", "throughput": 5867.45, "total_tokens": 5779976} {"current_steps": 8855, "total_steps": 33920, "loss": 0.3879, "lr": 9.230724528145722e-06, "epoch": 5.221108490566038, "percentage": 26.11, "elapsed_time": "0:16:25", "remaining_time": "0:46:29", "throughput": 5867.03, "total_tokens": 5782376} {"current_steps": 8860, "total_steps": 33920, "loss": 0.3876, "lr": 9.229352832697122e-06, "epoch": 5.224056603773585, "percentage": 26.12, "elapsed_time": "0:16:26", "remaining_time": "0:46:29", "throughput": 5867.33, "total_tokens": 5785704} {"current_steps": 8865, "total_steps": 33920, "loss": 0.5026, "lr": 9.22798001750913e-06, "epoch": 5.227004716981132, "percentage": 26.14, "elapsed_time": "0:16:26", "remaining_time": "0:46:28", "throughput": 5867.66, "total_tokens": 5789736} {"current_steps": 8870, "total_steps": 33920, "loss": 0.2945, "lr": 9.226606082945209e-06, "epoch": 5.2299528301886795, "percentage": 26.15, "elapsed_time": "0:16:27", "remaining_time": "0:46:28", "throughput": 5867.22, "total_tokens": 5792168} {"current_steps": 8875, "total_steps": 33920, "loss": 0.4544, "lr": 9.225231029369112e-06, "epoch": 5.232900943396227, "percentage": 26.16, "elapsed_time": "0:16:27", "remaining_time": "0:46:27", "throughput": 5867.25, "total_tokens": 5795112} {"current_steps": 8880, "total_steps": 33920, "loss": 0.5022, "lr": 9.22385485714489e-06, "epoch": 5.235849056603773, "percentage": 26.18, "elapsed_time": "0:16:28", "remaining_time": "0:46:26", "throughput": 5867.46, "total_tokens": 5798216} {"current_steps": 8885, "total_steps": 33920, "loss": 0.4593, "lr": 9.222477566636889e-06, "epoch": 5.2387971698113205, "percentage": 26.19, "elapsed_time": "0:16:28", "remaining_time": "0:46:25", "throughput": 5867.51, "total_tokens": 5801448} {"current_steps": 8890, "total_steps": 33920, "loss": 0.5805, "lr": 9.221099158209757e-06, "epoch": 5.241745283018868, "percentage": 26.21, "elapsed_time": "0:16:29", "remaining_time": "0:46:25", "throughput": 5867.31, "total_tokens": 5804072} {"current_steps": 8895, "total_steps": 33920, "loss": 0.4423, "lr": 9.219719632228429e-06, "epoch": 5.244693396226415, "percentage": 26.22, "elapsed_time": "0:16:29", "remaining_time": "0:46:24", "throughput": 5867.87, "total_tokens": 5808200} {"current_steps": 8900, "total_steps": 33920, "loss": 0.3634, "lr": 9.218338989058141e-06, "epoch": 5.247641509433962, "percentage": 26.24, "elapsed_time": "0:16:30", "remaining_time": "0:46:23", "throughput": 5867.24, "total_tokens": 5810376} {"current_steps": 8905, "total_steps": 33920, "loss": 0.5097, "lr": 9.21695722906443e-06, "epoch": 5.25058962264151, "percentage": 26.25, "elapsed_time": "0:16:30", "remaining_time": "0:46:23", "throughput": 5867.46, "total_tokens": 5813448} {"current_steps": 8910, "total_steps": 33920, "loss": 0.5123, "lr": 9.215574352613115e-06, "epoch": 5.253537735849057, "percentage": 26.27, "elapsed_time": "0:16:31", "remaining_time": "0:46:22", "throughput": 5867.64, "total_tokens": 5816584} {"current_steps": 8915, "total_steps": 33920, "loss": 0.4735, "lr": 9.214190360070323e-06, "epoch": 5.256485849056604, "percentage": 26.28, "elapsed_time": "0:16:31", "remaining_time": "0:46:22", "throughput": 5867.77, "total_tokens": 5820424} {"current_steps": 8920, "total_steps": 33920, "loss": 0.3986, "lr": 9.212805251802471e-06, "epoch": 5.259433962264151, "percentage": 26.3, "elapsed_time": "0:16:32", "remaining_time": "0:46:21", "throughput": 5867.78, "total_tokens": 5823432} {"current_steps": 8925, "total_steps": 33920, "loss": 0.4713, "lr": 9.211419028176273e-06, "epoch": 5.262382075471698, "percentage": 26.31, "elapsed_time": "0:16:32", "remaining_time": "0:46:20", "throughput": 5867.83, "total_tokens": 5826568} {"current_steps": 8930, "total_steps": 33920, "loss": 0.2991, "lr": 9.210031689558738e-06, "epoch": 5.265330188679245, "percentage": 26.33, "elapsed_time": "0:16:33", "remaining_time": "0:46:20", "throughput": 5867.58, "total_tokens": 5829256} {"current_steps": 8935, "total_steps": 33920, "loss": 0.3871, "lr": 9.208643236317166e-06, "epoch": 5.2682783018867925, "percentage": 26.34, "elapsed_time": "0:16:34", "remaining_time": "0:46:19", "throughput": 5867.93, "total_tokens": 5833160} {"current_steps": 8940, "total_steps": 33920, "loss": 0.4402, "lr": 9.20725366881916e-06, "epoch": 5.27122641509434, "percentage": 26.36, "elapsed_time": "0:16:34", "remaining_time": "0:46:19", "throughput": 5868.62, "total_tokens": 5838632} {"current_steps": 8945, "total_steps": 33920, "loss": 0.3734, "lr": 9.205862987432614e-06, "epoch": 5.274174528301887, "percentage": 26.37, "elapsed_time": "0:16:35", "remaining_time": "0:46:19", "throughput": 5868.44, "total_tokens": 5841416} {"current_steps": 8950, "total_steps": 33920, "loss": 0.4547, "lr": 9.204471192525715e-06, "epoch": 5.277122641509434, "percentage": 26.39, "elapsed_time": "0:16:35", "remaining_time": "0:46:18", "throughput": 5868.34, "total_tokens": 5844296} {"current_steps": 8955, "total_steps": 33920, "loss": 0.5152, "lr": 9.203078284466949e-06, "epoch": 5.280070754716981, "percentage": 26.4, "elapsed_time": "0:16:36", "remaining_time": "0:46:18", "throughput": 5868.53, "total_tokens": 5847944} {"current_steps": 8960, "total_steps": 33920, "loss": 0.4842, "lr": 9.201684263625091e-06, "epoch": 5.283018867924528, "percentage": 26.42, "elapsed_time": "0:16:36", "remaining_time": "0:46:17", "throughput": 5868.15, "total_tokens": 5850312} {"current_steps": 8965, "total_steps": 33920, "loss": 0.4647, "lr": 9.200289130369218e-06, "epoch": 5.285966981132075, "percentage": 26.43, "elapsed_time": "0:16:37", "remaining_time": "0:46:16", "throughput": 5868.23, "total_tokens": 5853256} {"current_steps": 8970, "total_steps": 33920, "loss": 0.5796, "lr": 9.198892885068693e-06, "epoch": 5.288915094339623, "percentage": 26.44, "elapsed_time": "0:16:37", "remaining_time": "0:46:15", "throughput": 5868.28, "total_tokens": 5856360} {"current_steps": 8975, "total_steps": 33920, "loss": 0.4164, "lr": 9.197495528093182e-06, "epoch": 5.29186320754717, "percentage": 26.46, "elapsed_time": "0:16:38", "remaining_time": "0:46:15", "throughput": 5868.18, "total_tokens": 5859304} {"current_steps": 8980, "total_steps": 33920, "loss": 0.456, "lr": 9.196097059812639e-06, "epoch": 5.294811320754717, "percentage": 26.47, "elapsed_time": "0:16:39", "remaining_time": "0:46:14", "throughput": 5868.39, "total_tokens": 5862760} {"current_steps": 8985, "total_steps": 33920, "loss": 0.4149, "lr": 9.194697480597316e-06, "epoch": 5.2977594339622645, "percentage": 26.49, "elapsed_time": "0:16:39", "remaining_time": "0:46:13", "throughput": 5868.55, "total_tokens": 5865928} {"current_steps": 8990, "total_steps": 33920, "loss": 0.4285, "lr": 9.193296790817755e-06, "epoch": 5.300707547169811, "percentage": 26.5, "elapsed_time": "0:16:40", "remaining_time": "0:46:13", "throughput": 5868.23, "total_tokens": 5868296} {"current_steps": 8995, "total_steps": 33920, "loss": 0.3426, "lr": 9.1918949908448e-06, "epoch": 5.303655660377358, "percentage": 26.52, "elapsed_time": "0:16:40", "remaining_time": "0:46:12", "throughput": 5868.4, "total_tokens": 5871976} {"current_steps": 9000, "total_steps": 33920, "loss": 0.3078, "lr": 9.190492081049578e-06, "epoch": 5.306603773584905, "percentage": 26.53, "elapsed_time": "0:16:41", "remaining_time": "0:46:12", "throughput": 5868.89, "total_tokens": 5875880} {"current_steps": 9005, "total_steps": 33920, "loss": 0.3029, "lr": 9.189088061803517e-06, "epoch": 5.309551886792453, "percentage": 26.55, "elapsed_time": "0:16:41", "remaining_time": "0:46:11", "throughput": 5868.88, "total_tokens": 5878696} {"current_steps": 9010, "total_steps": 33920, "loss": 0.5204, "lr": 9.187682933478337e-06, "epoch": 5.3125, "percentage": 26.56, "elapsed_time": "0:16:42", "remaining_time": "0:46:10", "throughput": 5869.0, "total_tokens": 5881640} {"current_steps": 9015, "total_steps": 33920, "loss": 0.4113, "lr": 9.186276696446054e-06, "epoch": 5.315448113207547, "percentage": 26.58, "elapsed_time": "0:16:42", "remaining_time": "0:46:09", "throughput": 5868.86, "total_tokens": 5884264} {"current_steps": 9020, "total_steps": 33920, "loss": 0.4451, "lr": 9.184869351078974e-06, "epoch": 5.318396226415095, "percentage": 26.59, "elapsed_time": "0:16:43", "remaining_time": "0:46:09", "throughput": 5869.14, "total_tokens": 5888072} {"current_steps": 9025, "total_steps": 33920, "loss": 0.3669, "lr": 9.183460897749697e-06, "epoch": 5.321344339622642, "percentage": 26.61, "elapsed_time": "0:16:43", "remaining_time": "0:46:08", "throughput": 5869.59, "total_tokens": 5891688} {"current_steps": 9030, "total_steps": 33920, "loss": 0.398, "lr": 9.182051336831117e-06, "epoch": 5.324292452830189, "percentage": 26.62, "elapsed_time": "0:16:44", "remaining_time": "0:46:08", "throughput": 5869.33, "total_tokens": 5894280} {"current_steps": 9035, "total_steps": 33920, "loss": 0.3878, "lr": 9.180640668696424e-06, "epoch": 5.3272405660377355, "percentage": 26.64, "elapsed_time": "0:16:44", "remaining_time": "0:46:07", "throughput": 5869.58, "total_tokens": 5897672} {"current_steps": 9040, "total_steps": 33920, "loss": 0.5118, "lr": 9.179228893719094e-06, "epoch": 5.330188679245283, "percentage": 26.65, "elapsed_time": "0:16:45", "remaining_time": "0:46:06", "throughput": 5869.45, "total_tokens": 5900328} {"current_steps": 9045, "total_steps": 33920, "loss": 0.4041, "lr": 9.177816012272904e-06, "epoch": 5.33313679245283, "percentage": 26.67, "elapsed_time": "0:16:45", "remaining_time": "0:46:05", "throughput": 5869.44, "total_tokens": 5903016} {"current_steps": 9050, "total_steps": 33920, "loss": 0.589, "lr": 9.17640202473192e-06, "epoch": 5.336084905660377, "percentage": 26.68, "elapsed_time": "0:16:46", "remaining_time": "0:46:05", "throughput": 5869.39, "total_tokens": 5905864} {"current_steps": 9055, "total_steps": 33920, "loss": 0.4051, "lr": 9.1749869314705e-06, "epoch": 5.339033018867925, "percentage": 26.7, "elapsed_time": "0:16:46", "remaining_time": "0:46:04", "throughput": 5869.44, "total_tokens": 5908904} {"current_steps": 9060, "total_steps": 33920, "loss": 0.5738, "lr": 9.173570732863295e-06, "epoch": 5.341981132075472, "percentage": 26.71, "elapsed_time": "0:16:47", "remaining_time": "0:46:03", "throughput": 5869.65, "total_tokens": 5912552} {"current_steps": 9065, "total_steps": 33920, "loss": 0.5138, "lr": 9.172153429285254e-06, "epoch": 5.344929245283019, "percentage": 26.72, "elapsed_time": "0:16:47", "remaining_time": "0:46:03", "throughput": 5869.32, "total_tokens": 5914888} {"current_steps": 9070, "total_steps": 33920, "loss": 0.5569, "lr": 9.17073502111161e-06, "epoch": 5.347877358490566, "percentage": 26.74, "elapsed_time": "0:16:48", "remaining_time": "0:46:02", "throughput": 5869.11, "total_tokens": 5917480} {"current_steps": 9075, "total_steps": 33920, "loss": 0.431, "lr": 9.169315508717895e-06, "epoch": 5.350825471698113, "percentage": 26.75, "elapsed_time": "0:16:48", "remaining_time": "0:46:01", "throughput": 5868.53, "total_tokens": 5919944} {"current_steps": 9080, "total_steps": 33920, "loss": 0.4494, "lr": 9.167894892479932e-06, "epoch": 5.35377358490566, "percentage": 26.77, "elapsed_time": "0:16:49", "remaining_time": "0:46:01", "throughput": 5868.88, "total_tokens": 5923240} {"current_steps": 9085, "total_steps": 33920, "loss": 0.4871, "lr": 9.16647317277383e-06, "epoch": 5.3567216981132075, "percentage": 26.78, "elapsed_time": "0:16:49", "remaining_time": "0:46:00", "throughput": 5869.01, "total_tokens": 5926344} {"current_steps": 9090, "total_steps": 33920, "loss": 0.4199, "lr": 9.165050349976002e-06, "epoch": 5.359669811320755, "percentage": 26.8, "elapsed_time": "0:16:50", "remaining_time": "0:45:59", "throughput": 5868.59, "total_tokens": 5929224} {"current_steps": 9095, "total_steps": 33920, "loss": 0.4641, "lr": 9.16362642446314e-06, "epoch": 5.362617924528302, "percentage": 26.81, "elapsed_time": "0:16:50", "remaining_time": "0:45:59", "throughput": 5868.89, "total_tokens": 5933096} {"current_steps": 9100, "total_steps": 33920, "loss": 0.449, "lr": 9.162201396612242e-06, "epoch": 5.365566037735849, "percentage": 26.83, "elapsed_time": "0:16:51", "remaining_time": "0:45:58", "throughput": 5869.13, "total_tokens": 5936712} {"current_steps": 9105, "total_steps": 33920, "loss": 0.6339, "lr": 9.160775266800583e-06, "epoch": 5.368514150943396, "percentage": 26.84, "elapsed_time": "0:16:52", "remaining_time": "0:45:58", "throughput": 5868.92, "total_tokens": 5939368} {"current_steps": 9110, "total_steps": 33920, "loss": 0.4358, "lr": 9.159348035405742e-06, "epoch": 5.371462264150943, "percentage": 26.86, "elapsed_time": "0:16:52", "remaining_time": "0:45:57", "throughput": 5868.88, "total_tokens": 5942408} {"current_steps": 9115, "total_steps": 33920, "loss": 0.4323, "lr": 9.157919702805582e-06, "epoch": 5.37441037735849, "percentage": 26.87, "elapsed_time": "0:16:53", "remaining_time": "0:45:56", "throughput": 5869.02, "total_tokens": 5945480} {"current_steps": 9120, "total_steps": 33920, "loss": 0.3451, "lr": 9.156490269378262e-06, "epoch": 5.377358490566038, "percentage": 26.89, "elapsed_time": "0:16:53", "remaining_time": "0:45:56", "throughput": 5869.1, "total_tokens": 5948872} {"current_steps": 9125, "total_steps": 33920, "loss": 0.5244, "lr": 9.15505973550223e-06, "epoch": 5.380306603773585, "percentage": 26.9, "elapsed_time": "0:16:54", "remaining_time": "0:45:55", "throughput": 5869.41, "total_tokens": 5952328} {"current_steps": 9130, "total_steps": 33920, "loss": 0.4124, "lr": 9.153628101556223e-06, "epoch": 5.383254716981132, "percentage": 26.92, "elapsed_time": "0:16:54", "remaining_time": "0:45:55", "throughput": 5869.64, "total_tokens": 5955720} {"current_steps": 9135, "total_steps": 33920, "loss": 0.4264, "lr": 9.152195367919277e-06, "epoch": 5.3862028301886795, "percentage": 26.93, "elapsed_time": "0:16:55", "remaining_time": "0:45:54", "throughput": 5869.33, "total_tokens": 5958376} {"current_steps": 9140, "total_steps": 33920, "loss": 0.3861, "lr": 9.150761534970713e-06, "epoch": 5.389150943396227, "percentage": 26.95, "elapsed_time": "0:16:55", "remaining_time": "0:45:53", "throughput": 5869.0, "total_tokens": 5961096} {"current_steps": 9145, "total_steps": 33920, "loss": 0.4391, "lr": 9.149326603090144e-06, "epoch": 5.392099056603773, "percentage": 26.96, "elapsed_time": "0:16:56", "remaining_time": "0:45:52", "throughput": 5869.0, "total_tokens": 5963944} {"current_steps": 9150, "total_steps": 33920, "loss": 0.4189, "lr": 9.147890572657471e-06, "epoch": 5.3950471698113205, "percentage": 26.98, "elapsed_time": "0:16:56", "remaining_time": "0:45:52", "throughput": 5868.85, "total_tokens": 5966696} {"current_steps": 9155, "total_steps": 33920, "loss": 0.6397, "lr": 9.146453444052895e-06, "epoch": 5.397995283018868, "percentage": 26.99, "elapsed_time": "0:16:57", "remaining_time": "0:45:51", "throughput": 5868.89, "total_tokens": 5969864} {"current_steps": 9160, "total_steps": 33920, "loss": 0.5828, "lr": 9.145015217656899e-06, "epoch": 5.400943396226415, "percentage": 27.0, "elapsed_time": "0:16:57", "remaining_time": "0:45:50", "throughput": 5869.02, "total_tokens": 5972840} {"current_steps": 9165, "total_steps": 33920, "loss": 0.5123, "lr": 9.14357589385026e-06, "epoch": 5.403891509433962, "percentage": 27.02, "elapsed_time": "0:16:58", "remaining_time": "0:45:50", "throughput": 5868.82, "total_tokens": 5975464} {"current_steps": 9170, "total_steps": 33920, "loss": 0.4051, "lr": 9.142135473014046e-06, "epoch": 5.40683962264151, "percentage": 27.03, "elapsed_time": "0:16:58", "remaining_time": "0:45:49", "throughput": 5869.03, "total_tokens": 5978792} {"current_steps": 9175, "total_steps": 33920, "loss": 0.3788, "lr": 9.140693955529614e-06, "epoch": 5.409787735849057, "percentage": 27.05, "elapsed_time": "0:16:59", "remaining_time": "0:45:48", "throughput": 5869.09, "total_tokens": 5981672} {"current_steps": 9180, "total_steps": 33920, "loss": 0.2851, "lr": 9.13925134177861e-06, "epoch": 5.412735849056604, "percentage": 27.06, "elapsed_time": "0:17:00", "remaining_time": "0:45:49", "throughput": 5869.91, "total_tokens": 5987752} {"current_steps": 9185, "total_steps": 33920, "loss": 0.3544, "lr": 9.137807632142977e-06, "epoch": 5.415683962264151, "percentage": 27.08, "elapsed_time": "0:17:00", "remaining_time": "0:45:48", "throughput": 5869.87, "total_tokens": 5990408} {"current_steps": 9190, "total_steps": 33920, "loss": 0.4482, "lr": 9.136362827004937e-06, "epoch": 5.418632075471698, "percentage": 27.09, "elapsed_time": "0:17:01", "remaining_time": "0:45:47", "throughput": 5870.03, "total_tokens": 5993704} {"current_steps": 9195, "total_steps": 33920, "loss": 0.3738, "lr": 9.134916926747015e-06, "epoch": 5.421580188679245, "percentage": 27.11, "elapsed_time": "0:17:01", "remaining_time": "0:45:47", "throughput": 5870.13, "total_tokens": 5997416} {"current_steps": 9200, "total_steps": 33920, "loss": 0.5928, "lr": 9.133469931752016e-06, "epoch": 5.4245283018867925, "percentage": 27.12, "elapsed_time": "0:17:02", "remaining_time": "0:45:46", "throughput": 5870.16, "total_tokens": 6000584} {"current_steps": 9205, "total_steps": 33920, "loss": 0.3036, "lr": 9.132021842403035e-06, "epoch": 5.42747641509434, "percentage": 27.14, "elapsed_time": "0:17:02", "remaining_time": "0:45:45", "throughput": 5869.82, "total_tokens": 6003080} {"current_steps": 9210, "total_steps": 33920, "loss": 0.4712, "lr": 9.130572659083465e-06, "epoch": 5.430424528301887, "percentage": 27.15, "elapsed_time": "0:17:03", "remaining_time": "0:45:45", "throughput": 5870.09, "total_tokens": 6006472} {"current_steps": 9215, "total_steps": 33920, "loss": 0.4492, "lr": 9.129122382176982e-06, "epoch": 5.433372641509434, "percentage": 27.17, "elapsed_time": "0:17:03", "remaining_time": "0:45:44", "throughput": 5870.56, "total_tokens": 6010440} {"current_steps": 9220, "total_steps": 33920, "loss": 0.4778, "lr": 9.127671012067554e-06, "epoch": 5.436320754716981, "percentage": 27.18, "elapsed_time": "0:17:04", "remaining_time": "0:45:44", "throughput": 5870.5, "total_tokens": 6013256} {"current_steps": 9225, "total_steps": 33920, "loss": 0.4007, "lr": 9.126218549139434e-06, "epoch": 5.439268867924528, "percentage": 27.2, "elapsed_time": "0:17:04", "remaining_time": "0:45:43", "throughput": 5871.0, "total_tokens": 6017192} {"current_steps": 9230, "total_steps": 33920, "loss": 0.3953, "lr": 9.124764993777171e-06, "epoch": 5.442216981132075, "percentage": 27.21, "elapsed_time": "0:17:05", "remaining_time": "0:45:42", "throughput": 5871.09, "total_tokens": 6020264} {"current_steps": 9235, "total_steps": 33920, "loss": 0.4557, "lr": 9.1233103463656e-06, "epoch": 5.445165094339623, "percentage": 27.23, "elapsed_time": "0:17:05", "remaining_time": "0:45:42", "throughput": 5871.27, "total_tokens": 6023752} {"current_steps": 9240, "total_steps": 33920, "loss": 0.3912, "lr": 9.121854607289842e-06, "epoch": 5.44811320754717, "percentage": 27.24, "elapsed_time": "0:17:06", "remaining_time": "0:45:42", "throughput": 5871.72, "total_tokens": 6028328} {"current_steps": 9245, "total_steps": 33920, "loss": 0.5873, "lr": 9.120397776935314e-06, "epoch": 5.451061320754717, "percentage": 27.26, "elapsed_time": "0:17:07", "remaining_time": "0:45:41", "throughput": 5871.74, "total_tokens": 6031272} {"current_steps": 9250, "total_steps": 33920, "loss": 0.3539, "lr": 9.118939855687717e-06, "epoch": 5.4540094339622645, "percentage": 27.27, "elapsed_time": "0:17:07", "remaining_time": "0:45:40", "throughput": 5871.95, "total_tokens": 6034472} {"current_steps": 9255, "total_steps": 33920, "loss": 0.4471, "lr": 9.117480843933043e-06, "epoch": 5.456957547169811, "percentage": 27.28, "elapsed_time": "0:17:08", "remaining_time": "0:45:40", "throughput": 5872.44, "total_tokens": 6038760} {"current_steps": 9260, "total_steps": 33920, "loss": 0.4641, "lr": 9.116020742057567e-06, "epoch": 5.459905660377358, "percentage": 27.3, "elapsed_time": "0:17:08", "remaining_time": "0:45:40", "throughput": 5872.58, "total_tokens": 6042312} {"current_steps": 9265, "total_steps": 33920, "loss": 0.5925, "lr": 9.114559550447863e-06, "epoch": 5.462853773584905, "percentage": 27.31, "elapsed_time": "0:17:09", "remaining_time": "0:45:39", "throughput": 5872.19, "total_tokens": 6044616} {"current_steps": 9270, "total_steps": 33920, "loss": 0.5181, "lr": 9.113097269490784e-06, "epoch": 5.465801886792453, "percentage": 27.33, "elapsed_time": "0:17:09", "remaining_time": "0:45:38", "throughput": 5872.58, "total_tokens": 6048424} {"current_steps": 9275, "total_steps": 33920, "loss": 0.4099, "lr": 9.111633899573476e-06, "epoch": 5.46875, "percentage": 27.34, "elapsed_time": "0:17:10", "remaining_time": "0:45:38", "throughput": 5872.31, "total_tokens": 6051016} {"current_steps": 9280, "total_steps": 33920, "loss": 0.5384, "lr": 9.110169441083374e-06, "epoch": 5.471698113207547, "percentage": 27.36, "elapsed_time": "0:17:10", "remaining_time": "0:45:37", "throughput": 5872.57, "total_tokens": 6054280} {"current_steps": 9285, "total_steps": 33920, "loss": 0.3662, "lr": 9.108703894408198e-06, "epoch": 5.474646226415095, "percentage": 27.37, "elapsed_time": "0:17:11", "remaining_time": "0:45:36", "throughput": 5872.41, "total_tokens": 6057128} {"current_steps": 9290, "total_steps": 33920, "loss": 0.4008, "lr": 9.107237259935959e-06, "epoch": 5.477594339622642, "percentage": 27.39, "elapsed_time": "0:17:11", "remaining_time": "0:45:35", "throughput": 5872.62, "total_tokens": 6060360} {"current_steps": 9295, "total_steps": 33920, "loss": 0.4012, "lr": 9.105769538054954e-06, "epoch": 5.480542452830189, "percentage": 27.4, "elapsed_time": "0:17:12", "remaining_time": "0:45:35", "throughput": 5872.68, "total_tokens": 6063976} {"current_steps": 9300, "total_steps": 33920, "loss": 0.4109, "lr": 9.104300729153768e-06, "epoch": 5.4834905660377355, "percentage": 27.42, "elapsed_time": "0:17:13", "remaining_time": "0:45:35", "throughput": 5873.38, "total_tokens": 6068488} {"current_steps": 9305, "total_steps": 33920, "loss": 0.4521, "lr": 9.102830833621277e-06, "epoch": 5.486438679245283, "percentage": 27.43, "elapsed_time": "0:17:13", "remaining_time": "0:45:34", "throughput": 5873.73, "total_tokens": 6071944} {"current_steps": 9310, "total_steps": 33920, "loss": 0.4442, "lr": 9.101359851846639e-06, "epoch": 5.48938679245283, "percentage": 27.45, "elapsed_time": "0:17:14", "remaining_time": "0:45:33", "throughput": 5873.81, "total_tokens": 6075144} {"current_steps": 9315, "total_steps": 33920, "loss": 0.5017, "lr": 9.099887784219305e-06, "epoch": 5.492334905660377, "percentage": 27.46, "elapsed_time": "0:17:14", "remaining_time": "0:45:33", "throughput": 5873.88, "total_tokens": 6078952} {"current_steps": 9320, "total_steps": 33920, "loss": 0.3857, "lr": 9.098414631129012e-06, "epoch": 5.495283018867925, "percentage": 27.48, "elapsed_time": "0:17:15", "remaining_time": "0:45:32", "throughput": 5873.8, "total_tokens": 6081736} {"current_steps": 9325, "total_steps": 33920, "loss": 0.3306, "lr": 9.09694039296578e-06, "epoch": 5.498231132075472, "percentage": 27.49, "elapsed_time": "0:17:15", "remaining_time": "0:45:32", "throughput": 5874.08, "total_tokens": 6085128} {"current_steps": 9330, "total_steps": 33920, "loss": 0.5741, "lr": 9.095465070119924e-06, "epoch": 5.501179245283019, "percentage": 27.51, "elapsed_time": "0:17:16", "remaining_time": "0:45:31", "throughput": 5874.37, "total_tokens": 6088680} {"current_steps": 9335, "total_steps": 33920, "loss": 0.6311, "lr": 9.09398866298204e-06, "epoch": 5.504127358490566, "percentage": 27.52, "elapsed_time": "0:17:17", "remaining_time": "0:45:31", "throughput": 5874.45, "total_tokens": 6091880} {"current_steps": 9340, "total_steps": 33920, "loss": 0.424, "lr": 9.09251117194301e-06, "epoch": 5.507075471698113, "percentage": 27.54, "elapsed_time": "0:17:17", "remaining_time": "0:45:30", "throughput": 5874.91, "total_tokens": 6095752} {"current_steps": 9345, "total_steps": 33920, "loss": 0.4407, "lr": 9.091032597394012e-06, "epoch": 5.51002358490566, "percentage": 27.55, "elapsed_time": "0:17:18", "remaining_time": "0:45:30", "throughput": 5875.17, "total_tokens": 6099176} {"current_steps": 9350, "total_steps": 33920, "loss": 0.4979, "lr": 9.089552939726503e-06, "epoch": 5.5129716981132075, "percentage": 27.56, "elapsed_time": "0:17:18", "remaining_time": "0:45:29", "throughput": 5875.3, "total_tokens": 6102152} {"current_steps": 9355, "total_steps": 33920, "loss": 0.5228, "lr": 9.088072199332227e-06, "epoch": 5.515919811320755, "percentage": 27.58, "elapsed_time": "0:17:19", "remaining_time": "0:45:28", "throughput": 5875.31, "total_tokens": 6105256} {"current_steps": 9360, "total_steps": 33920, "loss": 0.4303, "lr": 9.08659037660322e-06, "epoch": 5.518867924528302, "percentage": 27.59, "elapsed_time": "0:17:19", "remaining_time": "0:45:28", "throughput": 5875.17, "total_tokens": 6108488} {"current_steps": 9365, "total_steps": 33920, "loss": 0.385, "lr": 9.085107471931797e-06, "epoch": 5.521816037735849, "percentage": 27.61, "elapsed_time": "0:17:20", "remaining_time": "0:45:27", "throughput": 5875.75, "total_tokens": 6113256} {"current_steps": 9370, "total_steps": 33920, "loss": 0.4151, "lr": 9.083623485710564e-06, "epoch": 5.524764150943396, "percentage": 27.62, "elapsed_time": "0:17:20", "remaining_time": "0:45:27", "throughput": 5875.5, "total_tokens": 6115848} {"current_steps": 9375, "total_steps": 33920, "loss": 0.4596, "lr": 9.082138418332416e-06, "epoch": 5.527712264150943, "percentage": 27.64, "elapsed_time": "0:17:21", "remaining_time": "0:45:26", "throughput": 5875.1, "total_tokens": 6118216} {"current_steps": 9380, "total_steps": 33920, "loss": 0.3994, "lr": 9.080652270190527e-06, "epoch": 5.53066037735849, "percentage": 27.65, "elapsed_time": "0:17:21", "remaining_time": "0:45:25", "throughput": 5874.63, "total_tokens": 6120520} {"current_steps": 9385, "total_steps": 33920, "loss": 0.3377, "lr": 9.079165041678363e-06, "epoch": 5.533608490566038, "percentage": 27.67, "elapsed_time": "0:17:22", "remaining_time": "0:45:25", "throughput": 5874.92, "total_tokens": 6123880} {"current_steps": 9390, "total_steps": 33920, "loss": 0.4339, "lr": 9.077676733189675e-06, "epoch": 5.536556603773585, "percentage": 27.68, "elapsed_time": "0:17:22", "remaining_time": "0:45:24", "throughput": 5875.29, "total_tokens": 6127528} {"current_steps": 9395, "total_steps": 33920, "loss": 0.3373, "lr": 9.076187345118496e-06, "epoch": 5.539504716981132, "percentage": 27.7, "elapsed_time": "0:17:23", "remaining_time": "0:45:23", "throughput": 5874.97, "total_tokens": 6129864} {"current_steps": 9400, "total_steps": 33920, "loss": 0.5797, "lr": 9.074696877859152e-06, "epoch": 5.5424528301886795, "percentage": 27.71, "elapsed_time": "0:17:23", "remaining_time": "0:45:23", "throughput": 5875.32, "total_tokens": 6133704} {"current_steps": 9405, "total_steps": 33920, "loss": 0.3739, "lr": 9.073205331806248e-06, "epoch": 5.545400943396227, "percentage": 27.73, "elapsed_time": "0:17:24", "remaining_time": "0:45:22", "throughput": 5875.55, "total_tokens": 6136968} {"current_steps": 9410, "total_steps": 33920, "loss": 0.3247, "lr": 9.071712707354676e-06, "epoch": 5.548349056603773, "percentage": 27.74, "elapsed_time": "0:17:24", "remaining_time": "0:45:21", "throughput": 5875.62, "total_tokens": 6139880} {"current_steps": 9415, "total_steps": 33920, "loss": 0.5753, "lr": 9.070219004899618e-06, "epoch": 5.5512971698113205, "percentage": 27.76, "elapsed_time": "0:17:25", "remaining_time": "0:45:21", "throughput": 5875.92, "total_tokens": 6143112} {"current_steps": 9420, "total_steps": 33920, "loss": 0.3399, "lr": 9.068724224836538e-06, "epoch": 5.554245283018868, "percentage": 27.77, "elapsed_time": "0:17:26", "remaining_time": "0:45:20", "throughput": 5876.34, "total_tokens": 6146728} {"current_steps": 9425, "total_steps": 33920, "loss": 0.3981, "lr": 9.067228367561182e-06, "epoch": 5.557193396226415, "percentage": 27.79, "elapsed_time": "0:17:26", "remaining_time": "0:45:19", "throughput": 5876.11, "total_tokens": 6149192} {"current_steps": 9430, "total_steps": 33920, "loss": 0.5887, "lr": 9.06573143346959e-06, "epoch": 5.560141509433962, "percentage": 27.8, "elapsed_time": "0:17:27", "remaining_time": "0:45:20", "throughput": 5876.86, "total_tokens": 6155560} {"current_steps": 9435, "total_steps": 33920, "loss": 0.4602, "lr": 9.064233422958078e-06, "epoch": 5.56308962264151, "percentage": 27.82, "elapsed_time": "0:17:27", "remaining_time": "0:45:19", "throughput": 5877.21, "total_tokens": 6159080} {"current_steps": 9440, "total_steps": 33920, "loss": 0.4605, "lr": 9.062734336423248e-06, "epoch": 5.566037735849057, "percentage": 27.83, "elapsed_time": "0:17:28", "remaining_time": "0:45:19", "throughput": 5877.47, "total_tokens": 6162632} {"current_steps": 9445, "total_steps": 33920, "loss": 0.7057, "lr": 9.061234174261998e-06, "epoch": 5.568985849056604, "percentage": 27.84, "elapsed_time": "0:17:29", "remaining_time": "0:45:18", "throughput": 5877.6, "total_tokens": 6165928} {"current_steps": 9450, "total_steps": 33920, "loss": 0.459, "lr": 9.059732936871493e-06, "epoch": 5.571933962264151, "percentage": 27.86, "elapsed_time": "0:17:29", "remaining_time": "0:45:17", "throughput": 5877.38, "total_tokens": 6168680} {"current_steps": 9455, "total_steps": 33920, "loss": 0.5412, "lr": 9.058230624649198e-06, "epoch": 5.574882075471698, "percentage": 27.87, "elapsed_time": "0:17:30", "remaining_time": "0:45:17", "throughput": 5877.34, "total_tokens": 6171720} {"current_steps": 9460, "total_steps": 33920, "loss": 0.357, "lr": 9.056727237992856e-06, "epoch": 5.577830188679245, "percentage": 27.89, "elapsed_time": "0:17:30", "remaining_time": "0:45:16", "throughput": 5877.59, "total_tokens": 6175688} {"current_steps": 9465, "total_steps": 33920, "loss": 0.4673, "lr": 9.055222777300493e-06, "epoch": 5.5807783018867925, "percentage": 27.9, "elapsed_time": "0:17:31", "remaining_time": "0:45:16", "throughput": 5877.74, "total_tokens": 6178984} {"current_steps": 9470, "total_steps": 33920, "loss": 0.4402, "lr": 9.053717242970423e-06, "epoch": 5.58372641509434, "percentage": 27.92, "elapsed_time": "0:17:31", "remaining_time": "0:45:15", "throughput": 5877.95, "total_tokens": 6182184} {"current_steps": 9475, "total_steps": 33920, "loss": 0.7418, "lr": 9.052210635401244e-06, "epoch": 5.586674528301887, "percentage": 27.93, "elapsed_time": "0:17:32", "remaining_time": "0:45:14", "throughput": 5877.73, "total_tokens": 6184776} {"current_steps": 9480, "total_steps": 33920, "loss": 0.4825, "lr": 9.050702954991833e-06, "epoch": 5.589622641509434, "percentage": 27.95, "elapsed_time": "0:17:32", "remaining_time": "0:45:13", "throughput": 5877.64, "total_tokens": 6187528} {"current_steps": 9485, "total_steps": 33920, "loss": 0.448, "lr": 9.049194202141358e-06, "epoch": 5.592570754716981, "percentage": 27.96, "elapsed_time": "0:17:33", "remaining_time": "0:45:13", "throughput": 5877.56, "total_tokens": 6190472} {"current_steps": 9490, "total_steps": 33920, "loss": 0.453, "lr": 9.047684377249267e-06, "epoch": 5.595518867924528, "percentage": 27.98, "elapsed_time": "0:17:33", "remaining_time": "0:45:12", "throughput": 5877.27, "total_tokens": 6193192} {"current_steps": 9495, "total_steps": 33920, "loss": 0.5519, "lr": 9.046173480715292e-06, "epoch": 5.598466981132075, "percentage": 27.99, "elapsed_time": "0:17:34", "remaining_time": "0:45:11", "throughput": 5877.35, "total_tokens": 6196200} {"current_steps": 9500, "total_steps": 33920, "loss": 0.3322, "lr": 9.044661512939451e-06, "epoch": 5.601415094339623, "percentage": 28.01, "elapsed_time": "0:17:34", "remaining_time": "0:45:11", "throughput": 5877.12, "total_tokens": 6198856} {"current_steps": 9505, "total_steps": 33920, "loss": 0.6234, "lr": 9.043148474322043e-06, "epoch": 5.60436320754717, "percentage": 28.02, "elapsed_time": "0:17:35", "remaining_time": "0:45:10", "throughput": 5877.17, "total_tokens": 6202024} {"current_steps": 9510, "total_steps": 33920, "loss": 0.5384, "lr": 9.04163436526365e-06, "epoch": 5.607311320754717, "percentage": 28.04, "elapsed_time": "0:17:35", "remaining_time": "0:45:10", "throughput": 5877.27, "total_tokens": 6205352} {"current_steps": 9515, "total_steps": 33920, "loss": 0.4535, "lr": 9.040119186165142e-06, "epoch": 5.6102594339622645, "percentage": 28.05, "elapsed_time": "0:17:36", "remaining_time": "0:45:09", "throughput": 5877.08, "total_tokens": 6207848} {"current_steps": 9520, "total_steps": 33920, "loss": 0.3904, "lr": 9.038602937427665e-06, "epoch": 5.613207547169811, "percentage": 28.07, "elapsed_time": "0:17:36", "remaining_time": "0:45:08", "throughput": 5877.15, "total_tokens": 6210920} {"current_steps": 9525, "total_steps": 33920, "loss": 0.6985, "lr": 9.037085619452658e-06, "epoch": 5.616155660377358, "percentage": 28.08, "elapsed_time": "0:17:37", "remaining_time": "0:45:08", "throughput": 5877.8, "total_tokens": 6215432} {"current_steps": 9530, "total_steps": 33920, "loss": 0.3224, "lr": 9.035567232641833e-06, "epoch": 5.619103773584905, "percentage": 28.1, "elapsed_time": "0:17:37", "remaining_time": "0:45:07", "throughput": 5877.96, "total_tokens": 6218760} {"current_steps": 9535, "total_steps": 33920, "loss": 0.4155, "lr": 9.03404777739719e-06, "epoch": 5.622051886792453, "percentage": 28.11, "elapsed_time": "0:17:38", "remaining_time": "0:45:07", "throughput": 5878.42, "total_tokens": 6222952} {"current_steps": 9540, "total_steps": 33920, "loss": 0.4727, "lr": 9.032527254121013e-06, "epoch": 5.625, "percentage": 28.12, "elapsed_time": "0:17:39", "remaining_time": "0:45:06", "throughput": 5878.73, "total_tokens": 6226376} {"current_steps": 9545, "total_steps": 33920, "loss": 0.3267, "lr": 9.031005663215867e-06, "epoch": 5.627948113207547, "percentage": 28.14, "elapsed_time": "0:17:39", "remaining_time": "0:45:05", "throughput": 5878.9, "total_tokens": 6229448} {"current_steps": 9550, "total_steps": 33920, "loss": 0.4122, "lr": 9.029483005084595e-06, "epoch": 5.630896226415095, "percentage": 28.15, "elapsed_time": "0:17:40", "remaining_time": "0:45:05", "throughput": 5879.23, "total_tokens": 6233224} {"current_steps": 9555, "total_steps": 33920, "loss": 0.4086, "lr": 9.027959280130337e-06, "epoch": 5.633844339622642, "percentage": 28.17, "elapsed_time": "0:17:40", "remaining_time": "0:45:04", "throughput": 5879.45, "total_tokens": 6236392} {"current_steps": 9560, "total_steps": 33920, "loss": 0.469, "lr": 9.026434488756496e-06, "epoch": 5.636792452830189, "percentage": 28.18, "elapsed_time": "0:17:41", "remaining_time": "0:45:04", "throughput": 5879.38, "total_tokens": 6239112} {"current_steps": 9565, "total_steps": 33920, "loss": 0.518, "lr": 9.024908631366774e-06, "epoch": 5.6397405660377355, "percentage": 28.2, "elapsed_time": "0:17:41", "remaining_time": "0:45:03", "throughput": 5879.78, "total_tokens": 6242568} {"current_steps": 9570, "total_steps": 33920, "loss": 0.406, "lr": 9.023381708365143e-06, "epoch": 5.642688679245283, "percentage": 28.21, "elapsed_time": "0:17:42", "remaining_time": "0:45:02", "throughput": 5879.87, "total_tokens": 6245640} {"current_steps": 9575, "total_steps": 33920, "loss": 0.3532, "lr": 9.021853720155866e-06, "epoch": 5.64563679245283, "percentage": 28.23, "elapsed_time": "0:17:42", "remaining_time": "0:45:02", "throughput": 5879.98, "total_tokens": 6248744} {"current_steps": 9580, "total_steps": 33920, "loss": 0.5186, "lr": 9.020324667143483e-06, "epoch": 5.648584905660377, "percentage": 28.24, "elapsed_time": "0:17:43", "remaining_time": "0:45:01", "throughput": 5880.07, "total_tokens": 6251624} {"current_steps": 9585, "total_steps": 33920, "loss": 0.367, "lr": 9.018794549732819e-06, "epoch": 5.651533018867925, "percentage": 28.26, "elapsed_time": "0:17:43", "remaining_time": "0:45:00", "throughput": 5880.22, "total_tokens": 6254664} {"current_steps": 9590, "total_steps": 33920, "loss": 0.4848, "lr": 9.017263368328977e-06, "epoch": 5.654481132075472, "percentage": 28.27, "elapsed_time": "0:17:44", "remaining_time": "0:44:59", "throughput": 5880.43, "total_tokens": 6257928} {"current_steps": 9595, "total_steps": 33920, "loss": 0.4894, "lr": 9.015731123337344e-06, "epoch": 5.657429245283019, "percentage": 28.29, "elapsed_time": "0:17:44", "remaining_time": "0:44:59", "throughput": 5880.63, "total_tokens": 6261416} {"current_steps": 9600, "total_steps": 33920, "loss": 0.3968, "lr": 9.01419781516359e-06, "epoch": 5.660377358490566, "percentage": 28.3, "elapsed_time": "0:17:45", "remaining_time": "0:44:58", "throughput": 5880.83, "total_tokens": 6264520} {"current_steps": 9605, "total_steps": 33920, "loss": 0.4933, "lr": 9.012663444213664e-06, "epoch": 5.663325471698113, "percentage": 28.32, "elapsed_time": "0:17:45", "remaining_time": "0:44:57", "throughput": 5881.16, "total_tokens": 6267944} {"current_steps": 9610, "total_steps": 33920, "loss": 0.4628, "lr": 9.011128010893797e-06, "epoch": 5.66627358490566, "percentage": 28.33, "elapsed_time": "0:17:46", "remaining_time": "0:44:57", "throughput": 5881.36, "total_tokens": 6271208} {"current_steps": 9615, "total_steps": 33920, "loss": 0.4661, "lr": 9.009591515610503e-06, "epoch": 5.6692216981132075, "percentage": 28.35, "elapsed_time": "0:17:46", "remaining_time": "0:44:56", "throughput": 5881.47, "total_tokens": 6274312} {"current_steps": 9620, "total_steps": 33920, "loss": 0.4437, "lr": 9.008053958770575e-06, "epoch": 5.672169811320755, "percentage": 28.36, "elapsed_time": "0:17:47", "remaining_time": "0:44:55", "throughput": 5881.51, "total_tokens": 6277256} {"current_steps": 9625, "total_steps": 33920, "loss": 0.4205, "lr": 9.006515340781087e-06, "epoch": 5.675117924528302, "percentage": 28.38, "elapsed_time": "0:17:47", "remaining_time": "0:44:55", "throughput": 5881.82, "total_tokens": 6280712} {"current_steps": 9630, "total_steps": 33920, "loss": 0.3217, "lr": 9.004975662049396e-06, "epoch": 5.678066037735849, "percentage": 28.39, "elapsed_time": "0:17:48", "remaining_time": "0:44:54", "throughput": 5882.03, "total_tokens": 6283816} {"current_steps": 9635, "total_steps": 33920, "loss": 0.4349, "lr": 9.003434922983138e-06, "epoch": 5.681014150943396, "percentage": 28.41, "elapsed_time": "0:17:48", "remaining_time": "0:44:53", "throughput": 5881.87, "total_tokens": 6286248} {"current_steps": 9640, "total_steps": 33920, "loss": 0.4269, "lr": 9.00189312399023e-06, "epoch": 5.683962264150943, "percentage": 28.42, "elapsed_time": "0:17:49", "remaining_time": "0:44:52", "throughput": 5882.0, "total_tokens": 6289096} {"current_steps": 9645, "total_steps": 33920, "loss": 0.3732, "lr": 9.00035026547887e-06, "epoch": 5.68691037735849, "percentage": 28.43, "elapsed_time": "0:17:49", "remaining_time": "0:44:52", "throughput": 5882.16, "total_tokens": 6292392} {"current_steps": 9650, "total_steps": 33920, "loss": 0.469, "lr": 8.998806347857537e-06, "epoch": 5.689858490566038, "percentage": 28.45, "elapsed_time": "0:17:50", "remaining_time": "0:44:51", "throughput": 5882.25, "total_tokens": 6295304} {"current_steps": 9655, "total_steps": 33920, "loss": 0.4393, "lr": 8.99726137153499e-06, "epoch": 5.692806603773585, "percentage": 28.46, "elapsed_time": "0:17:50", "remaining_time": "0:44:50", "throughput": 5882.23, "total_tokens": 6298088} {"current_steps": 9660, "total_steps": 33920, "loss": 0.4891, "lr": 8.995715336920266e-06, "epoch": 5.695754716981132, "percentage": 28.48, "elapsed_time": "0:17:51", "remaining_time": "0:44:50", "throughput": 5882.54, "total_tokens": 6301384} {"current_steps": 9665, "total_steps": 33920, "loss": 0.5764, "lr": 8.994168244422687e-06, "epoch": 5.6987028301886795, "percentage": 28.49, "elapsed_time": "0:17:51", "remaining_time": "0:44:49", "throughput": 5882.69, "total_tokens": 6304392} {"current_steps": 9670, "total_steps": 33920, "loss": 0.378, "lr": 8.992620094451852e-06, "epoch": 5.701650943396227, "percentage": 28.51, "elapsed_time": "0:17:52", "remaining_time": "0:44:49", "throughput": 5883.23, "total_tokens": 6308552} {"current_steps": 9675, "total_steps": 33920, "loss": 0.4368, "lr": 8.991070887417639e-06, "epoch": 5.704599056603773, "percentage": 28.52, "elapsed_time": "0:17:52", "remaining_time": "0:44:48", "throughput": 5883.33, "total_tokens": 6311368} {"current_steps": 9680, "total_steps": 33920, "loss": 0.4913, "lr": 8.989520623730208e-06, "epoch": 5.7075471698113205, "percentage": 28.54, "elapsed_time": "0:17:53", "remaining_time": "0:44:47", "throughput": 5883.76, "total_tokens": 6315112} {"current_steps": 9685, "total_steps": 33920, "loss": 0.5032, "lr": 8.987969303799998e-06, "epoch": 5.710495283018868, "percentage": 28.55, "elapsed_time": "0:17:53", "remaining_time": "0:44:47", "throughput": 5884.28, "total_tokens": 6319176} {"current_steps": 9690, "total_steps": 33920, "loss": 0.4111, "lr": 8.986416928037728e-06, "epoch": 5.713443396226415, "percentage": 28.57, "elapsed_time": "0:17:54", "remaining_time": "0:44:46", "throughput": 5884.25, "total_tokens": 6321832} {"current_steps": 9695, "total_steps": 33920, "loss": 0.4271, "lr": 8.984863496854395e-06, "epoch": 5.716391509433962, "percentage": 28.58, "elapsed_time": "0:17:54", "remaining_time": "0:44:45", "throughput": 5884.25, "total_tokens": 6324648} {"current_steps": 9700, "total_steps": 33920, "loss": 0.4236, "lr": 8.983309010661279e-06, "epoch": 5.71933962264151, "percentage": 28.6, "elapsed_time": "0:17:55", "remaining_time": "0:44:44", "throughput": 5884.29, "total_tokens": 6327304} {"current_steps": 9705, "total_steps": 33920, "loss": 0.6688, "lr": 8.981753469869934e-06, "epoch": 5.722287735849057, "percentage": 28.61, "elapsed_time": "0:17:55", "remaining_time": "0:44:44", "throughput": 5884.53, "total_tokens": 6330504} {"current_steps": 9710, "total_steps": 33920, "loss": 0.4468, "lr": 8.980196874892198e-06, "epoch": 5.725235849056604, "percentage": 28.63, "elapsed_time": "0:17:56", "remaining_time": "0:44:43", "throughput": 5884.54, "total_tokens": 6333192} {"current_steps": 9715, "total_steps": 33920, "loss": 0.3965, "lr": 8.978639226140184e-06, "epoch": 5.728183962264151, "percentage": 28.64, "elapsed_time": "0:17:56", "remaining_time": "0:44:42", "throughput": 5884.79, "total_tokens": 6336488} {"current_steps": 9720, "total_steps": 33920, "loss": 0.3408, "lr": 8.977080524026289e-06, "epoch": 5.731132075471698, "percentage": 28.66, "elapsed_time": "0:17:57", "remaining_time": "0:44:42", "throughput": 5885.14, "total_tokens": 6340296} {"current_steps": 9725, "total_steps": 33920, "loss": 0.5933, "lr": 8.975520768963186e-06, "epoch": 5.734080188679245, "percentage": 28.67, "elapsed_time": "0:17:57", "remaining_time": "0:44:41", "throughput": 5884.8, "total_tokens": 6342664} {"current_steps": 9730, "total_steps": 33920, "loss": 0.4087, "lr": 8.973959961363825e-06, "epoch": 5.7370283018867925, "percentage": 28.69, "elapsed_time": "0:17:58", "remaining_time": "0:44:40", "throughput": 5884.59, "total_tokens": 6345384} {"current_steps": 9735, "total_steps": 33920, "loss": 0.4258, "lr": 8.972398101641438e-06, "epoch": 5.73997641509434, "percentage": 28.7, "elapsed_time": "0:17:58", "remaining_time": "0:44:40", "throughput": 5884.29, "total_tokens": 6348104} {"current_steps": 9740, "total_steps": 33920, "loss": 0.4466, "lr": 8.970835190209532e-06, "epoch": 5.742924528301887, "percentage": 28.71, "elapsed_time": "0:17:59", "remaining_time": "0:44:41", "throughput": 5885.11, "total_tokens": 6355592} {"current_steps": 9745, "total_steps": 33920, "loss": 0.5416, "lr": 8.969271227481899e-06, "epoch": 5.745872641509434, "percentage": 28.73, "elapsed_time": "0:18:00", "remaining_time": "0:44:40", "throughput": 5885.43, "total_tokens": 6359144} {"current_steps": 9750, "total_steps": 33920, "loss": 0.4149, "lr": 8.967706213872599e-06, "epoch": 5.748820754716981, "percentage": 28.74, "elapsed_time": "0:18:01", "remaining_time": "0:44:39", "throughput": 5885.78, "total_tokens": 6362696} {"current_steps": 9755, "total_steps": 33920, "loss": 0.4449, "lr": 8.966140149795981e-06, "epoch": 5.751768867924528, "percentage": 28.76, "elapsed_time": "0:18:01", "remaining_time": "0:44:39", "throughput": 5886.1, "total_tokens": 6366120} {"current_steps": 9760, "total_steps": 33920, "loss": 0.3594, "lr": 8.964573035666663e-06, "epoch": 5.754716981132075, "percentage": 28.77, "elapsed_time": "0:18:02", "remaining_time": "0:44:38", "throughput": 5886.26, "total_tokens": 6369224} {"current_steps": 9765, "total_steps": 33920, "loss": 0.4247, "lr": 8.96300487189955e-06, "epoch": 5.757665094339623, "percentage": 28.79, "elapsed_time": "0:18:02", "remaining_time": "0:44:37", "throughput": 5886.23, "total_tokens": 6372328} {"current_steps": 9770, "total_steps": 33920, "loss": 0.5206, "lr": 8.961435658909816e-06, "epoch": 5.76061320754717, "percentage": 28.8, "elapsed_time": "0:18:03", "remaining_time": "0:44:37", "throughput": 5886.19, "total_tokens": 6375368} {"current_steps": 9775, "total_steps": 33920, "loss": 0.4524, "lr": 8.959865397112918e-06, "epoch": 5.763561320754717, "percentage": 28.82, "elapsed_time": "0:18:03", "remaining_time": "0:44:36", "throughput": 5886.34, "total_tokens": 6378440} {"current_steps": 9780, "total_steps": 33920, "loss": 0.4644, "lr": 8.95829408692459e-06, "epoch": 5.7665094339622645, "percentage": 28.83, "elapsed_time": "0:18:04", "remaining_time": "0:44:35", "throughput": 5886.22, "total_tokens": 6381096} {"current_steps": 9785, "total_steps": 33920, "loss": 0.3863, "lr": 8.956721728760845e-06, "epoch": 5.769457547169811, "percentage": 28.85, "elapsed_time": "0:18:04", "remaining_time": "0:44:35", "throughput": 5886.37, "total_tokens": 6384328} {"current_steps": 9790, "total_steps": 33920, "loss": 0.5591, "lr": 8.95514832303797e-06, "epoch": 5.772405660377358, "percentage": 28.86, "elapsed_time": "0:18:05", "remaining_time": "0:44:34", "throughput": 5886.81, "total_tokens": 6388232} {"current_steps": 9795, "total_steps": 33920, "loss": 0.3714, "lr": 8.953573870172528e-06, "epoch": 5.775353773584905, "percentage": 28.88, "elapsed_time": "0:18:05", "remaining_time": "0:44:33", "throughput": 5886.79, "total_tokens": 6390952} {"current_steps": 9800, "total_steps": 33920, "loss": 0.3962, "lr": 8.951998370581368e-06, "epoch": 5.778301886792453, "percentage": 28.89, "elapsed_time": "0:18:06", "remaining_time": "0:44:33", "throughput": 5886.75, "total_tokens": 6394472} {"current_steps": 9805, "total_steps": 33920, "loss": 0.5625, "lr": 8.950421824681605e-06, "epoch": 5.78125, "percentage": 28.91, "elapsed_time": "0:18:06", "remaining_time": "0:44:32", "throughput": 5887.21, "total_tokens": 6398312} {"current_steps": 9810, "total_steps": 33920, "loss": 0.4149, "lr": 8.948844232890638e-06, "epoch": 5.784198113207547, "percentage": 28.92, "elapsed_time": "0:18:07", "remaining_time": "0:44:32", "throughput": 5887.57, "total_tokens": 6401768} {"current_steps": 9815, "total_steps": 33920, "loss": 0.5064, "lr": 8.947265595626144e-06, "epoch": 5.787146226415095, "percentage": 28.94, "elapsed_time": "0:18:07", "remaining_time": "0:44:31", "throughput": 5887.68, "total_tokens": 6404872} {"current_steps": 9820, "total_steps": 33920, "loss": 0.4599, "lr": 8.945685913306071e-06, "epoch": 5.790094339622642, "percentage": 28.95, "elapsed_time": "0:18:08", "remaining_time": "0:44:31", "throughput": 5887.83, "total_tokens": 6408296} {"current_steps": 9825, "total_steps": 33920, "loss": 0.3621, "lr": 8.944105186348646e-06, "epoch": 5.793042452830189, "percentage": 28.97, "elapsed_time": "0:18:08", "remaining_time": "0:44:30", "throughput": 5887.99, "total_tokens": 6411464} {"current_steps": 9830, "total_steps": 33920, "loss": 0.4174, "lr": 8.942523415172377e-06, "epoch": 5.7959905660377355, "percentage": 28.98, "elapsed_time": "0:18:09", "remaining_time": "0:44:29", "throughput": 5888.07, "total_tokens": 6414408} {"current_steps": 9835, "total_steps": 33920, "loss": 0.3615, "lr": 8.94094060019604e-06, "epoch": 5.798938679245283, "percentage": 28.99, "elapsed_time": "0:18:09", "remaining_time": "0:44:29", "throughput": 5888.15, "total_tokens": 6417448} {"current_steps": 9840, "total_steps": 33920, "loss": 0.4851, "lr": 8.939356741838696e-06, "epoch": 5.80188679245283, "percentage": 29.01, "elapsed_time": "0:18:10", "remaining_time": "0:44:28", "throughput": 5888.47, "total_tokens": 6420936} {"current_steps": 9845, "total_steps": 33920, "loss": 0.3226, "lr": 8.937771840519677e-06, "epoch": 5.804834905660377, "percentage": 29.02, "elapsed_time": "0:18:10", "remaining_time": "0:44:27", "throughput": 5888.78, "total_tokens": 6424264} {"current_steps": 9850, "total_steps": 33920, "loss": 0.411, "lr": 8.936185896658593e-06, "epoch": 5.807783018867925, "percentage": 29.04, "elapsed_time": "0:18:11", "remaining_time": "0:44:26", "throughput": 5888.76, "total_tokens": 6426920} {"current_steps": 9855, "total_steps": 33920, "loss": 0.3852, "lr": 8.934598910675329e-06, "epoch": 5.810731132075472, "percentage": 29.05, "elapsed_time": "0:18:11", "remaining_time": "0:44:26", "throughput": 5888.96, "total_tokens": 6430216} {"current_steps": 9860, "total_steps": 33920, "loss": 0.4039, "lr": 8.933010882990044e-06, "epoch": 5.813679245283019, "percentage": 29.07, "elapsed_time": "0:18:12", "remaining_time": "0:44:25", "throughput": 5889.36, "total_tokens": 6434088} {"current_steps": 9865, "total_steps": 33920, "loss": 0.367, "lr": 8.93142181402318e-06, "epoch": 5.816627358490566, "percentage": 29.08, "elapsed_time": "0:18:13", "remaining_time": "0:44:25", "throughput": 5889.68, "total_tokens": 6437640} {"current_steps": 9870, "total_steps": 33920, "loss": 0.4027, "lr": 8.929831704195445e-06, "epoch": 5.819575471698113, "percentage": 29.1, "elapsed_time": "0:18:13", "remaining_time": "0:44:24", "throughput": 5889.82, "total_tokens": 6440744} {"current_steps": 9875, "total_steps": 33920, "loss": 0.3891, "lr": 8.928240553927831e-06, "epoch": 5.82252358490566, "percentage": 29.11, "elapsed_time": "0:18:13", "remaining_time": "0:44:23", "throughput": 5889.69, "total_tokens": 6443208} {"current_steps": 9880, "total_steps": 33920, "loss": 0.3448, "lr": 8.926648363641602e-06, "epoch": 5.8254716981132075, "percentage": 29.13, "elapsed_time": "0:18:14", "remaining_time": "0:44:23", "throughput": 5889.88, "total_tokens": 6446312} {"current_steps": 9885, "total_steps": 33920, "loss": 0.5208, "lr": 8.925055133758294e-06, "epoch": 5.828419811320755, "percentage": 29.14, "elapsed_time": "0:18:14", "remaining_time": "0:44:22", "throughput": 5890.16, "total_tokens": 6449640} {"current_steps": 9890, "total_steps": 33920, "loss": 0.4145, "lr": 8.923460864699723e-06, "epoch": 5.831367924528302, "percentage": 29.16, "elapsed_time": "0:18:15", "remaining_time": "0:44:21", "throughput": 5890.38, "total_tokens": 6453384} {"current_steps": 9895, "total_steps": 33920, "loss": 0.5891, "lr": 8.921865556887979e-06, "epoch": 5.834316037735849, "percentage": 29.17, "elapsed_time": "0:18:16", "remaining_time": "0:44:21", "throughput": 5890.18, "total_tokens": 6455880} {"current_steps": 9900, "total_steps": 33920, "loss": 0.4462, "lr": 8.920269210745426e-06, "epoch": 5.837264150943396, "percentage": 29.19, "elapsed_time": "0:18:16", "remaining_time": "0:44:20", "throughput": 5890.31, "total_tokens": 6458984} {"current_steps": 9905, "total_steps": 33920, "loss": 0.3977, "lr": 8.918671826694704e-06, "epoch": 5.840212264150943, "percentage": 29.2, "elapsed_time": "0:18:17", "remaining_time": "0:44:19", "throughput": 5890.57, "total_tokens": 6462344} {"current_steps": 9910, "total_steps": 33920, "loss": 0.4414, "lr": 8.91707340515873e-06, "epoch": 5.84316037735849, "percentage": 29.22, "elapsed_time": "0:18:17", "remaining_time": "0:44:19", "throughput": 5890.75, "total_tokens": 6465288} {"current_steps": 9915, "total_steps": 33920, "loss": 0.4247, "lr": 8.915473946560688e-06, "epoch": 5.846108490566038, "percentage": 29.23, "elapsed_time": "0:18:18", "remaining_time": "0:44:19", "throughput": 5891.53, "total_tokens": 6470728} {"current_steps": 9920, "total_steps": 33920, "loss": 0.5315, "lr": 8.913873451324044e-06, "epoch": 5.849056603773585, "percentage": 29.25, "elapsed_time": "0:18:18", "remaining_time": "0:44:18", "throughput": 5891.94, "total_tokens": 6474376} {"current_steps": 9925, "total_steps": 33920, "loss": 0.3625, "lr": 8.912271919872538e-06, "epoch": 5.852004716981132, "percentage": 29.26, "elapsed_time": "0:18:19", "remaining_time": "0:44:17", "throughput": 5892.24, "total_tokens": 6477672} {"current_steps": 9930, "total_steps": 33920, "loss": 0.5733, "lr": 8.910669352630176e-06, "epoch": 5.8549528301886795, "percentage": 29.27, "elapsed_time": "0:18:19", "remaining_time": "0:44:17", "throughput": 5892.07, "total_tokens": 6480136} {"current_steps": 9935, "total_steps": 33920, "loss": 0.3553, "lr": 8.909065750021253e-06, "epoch": 5.857900943396227, "percentage": 29.29, "elapsed_time": "0:18:20", "remaining_time": "0:44:16", "throughput": 5892.29, "total_tokens": 6483240} {"current_steps": 9940, "total_steps": 33920, "loss": 0.5216, "lr": 8.907461112470323e-06, "epoch": 5.860849056603773, "percentage": 29.3, "elapsed_time": "0:18:20", "remaining_time": "0:44:15", "throughput": 5892.47, "total_tokens": 6486600} {"current_steps": 9945, "total_steps": 33920, "loss": 0.4096, "lr": 8.905855440402225e-06, "epoch": 5.8637971698113205, "percentage": 29.32, "elapsed_time": "0:18:21", "remaining_time": "0:44:14", "throughput": 5892.31, "total_tokens": 6489128} {"current_steps": 9950, "total_steps": 33920, "loss": 0.5143, "lr": 8.904248734242065e-06, "epoch": 5.866745283018868, "percentage": 29.33, "elapsed_time": "0:18:21", "remaining_time": "0:44:14", "throughput": 5892.16, "total_tokens": 6491976} {"current_steps": 9955, "total_steps": 33920, "loss": 0.4387, "lr": 8.902640994415226e-06, "epoch": 5.869693396226415, "percentage": 29.35, "elapsed_time": "0:18:22", "remaining_time": "0:44:13", "throughput": 5892.32, "total_tokens": 6495464} {"current_steps": 9960, "total_steps": 33920, "loss": 0.4629, "lr": 8.901032221347364e-06, "epoch": 5.872641509433962, "percentage": 29.36, "elapsed_time": "0:18:22", "remaining_time": "0:44:13", "throughput": 5892.3, "total_tokens": 6498344} {"current_steps": 9965, "total_steps": 33920, "loss": 0.4315, "lr": 8.899422415464409e-06, "epoch": 5.87558962264151, "percentage": 29.38, "elapsed_time": "0:18:23", "remaining_time": "0:44:12", "throughput": 5892.64, "total_tokens": 6501864} {"current_steps": 9970, "total_steps": 33920, "loss": 0.5162, "lr": 8.897811577192565e-06, "epoch": 5.878537735849057, "percentage": 29.39, "elapsed_time": "0:18:23", "remaining_time": "0:44:11", "throughput": 5892.67, "total_tokens": 6504776} {"current_steps": 9975, "total_steps": 33920, "loss": 0.3986, "lr": 8.896199706958306e-06, "epoch": 5.881485849056604, "percentage": 29.41, "elapsed_time": "0:18:24", "remaining_time": "0:44:11", "throughput": 5892.81, "total_tokens": 6507912} {"current_steps": 9980, "total_steps": 33920, "loss": 0.4826, "lr": 8.894586805188384e-06, "epoch": 5.884433962264151, "percentage": 29.42, "elapsed_time": "0:18:24", "remaining_time": "0:44:10", "throughput": 5892.73, "total_tokens": 6510632} {"current_steps": 9985, "total_steps": 33920, "loss": 0.3284, "lr": 8.892972872309821e-06, "epoch": 5.887382075471698, "percentage": 29.44, "elapsed_time": "0:18:25", "remaining_time": "0:44:09", "throughput": 5892.69, "total_tokens": 6513640} {"current_steps": 9990, "total_steps": 33920, "loss": 0.4495, "lr": 8.89135790874991e-06, "epoch": 5.890330188679245, "percentage": 29.45, "elapsed_time": "0:18:25", "remaining_time": "0:44:09", "throughput": 5893.0, "total_tokens": 6517384} {"current_steps": 9995, "total_steps": 33920, "loss": 0.4596, "lr": 8.889741914936224e-06, "epoch": 5.8932783018867925, "percentage": 29.47, "elapsed_time": "0:18:26", "remaining_time": "0:44:08", "throughput": 5893.22, "total_tokens": 6520680} {"current_steps": 10000, "total_steps": 33920, "loss": 0.3534, "lr": 8.888124891296602e-06, "epoch": 5.89622641509434, "percentage": 29.48, "elapsed_time": "0:18:27", "remaining_time": "0:44:08", "throughput": 5893.43, "total_tokens": 6524264} {"current_steps": 10005, "total_steps": 33920, "loss": 0.4953, "lr": 8.886506838259156e-06, "epoch": 5.899174528301887, "percentage": 29.5, "elapsed_time": "0:18:27", "remaining_time": "0:44:07", "throughput": 5893.68, "total_tokens": 6527624} {"current_steps": 10010, "total_steps": 33920, "loss": 0.4272, "lr": 8.884887756252279e-06, "epoch": 5.902122641509434, "percentage": 29.51, "elapsed_time": "0:18:28", "remaining_time": "0:44:06", "throughput": 5893.54, "total_tokens": 6530184} {"current_steps": 10015, "total_steps": 33920, "loss": 0.3933, "lr": 8.88326764570462e-06, "epoch": 5.905070754716981, "percentage": 29.53, "elapsed_time": "0:18:28", "remaining_time": "0:44:06", "throughput": 5893.8, "total_tokens": 6534152} {"current_steps": 10020, "total_steps": 33920, "loss": 0.3367, "lr": 8.88164650704512e-06, "epoch": 5.908018867924528, "percentage": 29.54, "elapsed_time": "0:18:29", "remaining_time": "0:44:05", "throughput": 5893.99, "total_tokens": 6537544} {"current_steps": 10025, "total_steps": 33920, "loss": 0.5126, "lr": 8.880024340702978e-06, "epoch": 5.910966981132075, "percentage": 29.55, "elapsed_time": "0:18:29", "remaining_time": "0:44:04", "throughput": 5893.86, "total_tokens": 6540232} {"current_steps": 10030, "total_steps": 33920, "loss": 0.3383, "lr": 8.878401147107667e-06, "epoch": 5.913915094339623, "percentage": 29.57, "elapsed_time": "0:18:30", "remaining_time": "0:44:04", "throughput": 5894.3, "total_tokens": 6544328} {"current_steps": 10035, "total_steps": 33920, "loss": 0.442, "lr": 8.87677692668894e-06, "epoch": 5.91686320754717, "percentage": 29.58, "elapsed_time": "0:18:30", "remaining_time": "0:44:03", "throughput": 5894.57, "total_tokens": 6547624} {"current_steps": 10040, "total_steps": 33920, "loss": 0.6714, "lr": 8.875151679876813e-06, "epoch": 5.919811320754717, "percentage": 29.6, "elapsed_time": "0:18:31", "remaining_time": "0:44:03", "throughput": 5894.9, "total_tokens": 6551080} {"current_steps": 10045, "total_steps": 33920, "loss": 0.4746, "lr": 8.873525407101577e-06, "epoch": 5.9227594339622645, "percentage": 29.61, "elapsed_time": "0:18:31", "remaining_time": "0:44:02", "throughput": 5894.85, "total_tokens": 6554120} {"current_steps": 10050, "total_steps": 33920, "loss": 0.4872, "lr": 8.871898108793796e-06, "epoch": 5.925707547169811, "percentage": 29.63, "elapsed_time": "0:18:32", "remaining_time": "0:44:01", "throughput": 5894.89, "total_tokens": 6557000} {"current_steps": 10055, "total_steps": 33920, "loss": 0.4556, "lr": 8.870269785384304e-06, "epoch": 5.928655660377358, "percentage": 29.64, "elapsed_time": "0:18:32", "remaining_time": "0:44:01", "throughput": 5895.16, "total_tokens": 6560328} {"current_steps": 10060, "total_steps": 33920, "loss": 0.4022, "lr": 8.868640437304206e-06, "epoch": 5.931603773584905, "percentage": 29.66, "elapsed_time": "0:18:33", "remaining_time": "0:44:00", "throughput": 5895.33, "total_tokens": 6563432} {"current_steps": 10065, "total_steps": 33920, "loss": 0.5331, "lr": 8.86701006498488e-06, "epoch": 5.934551886792453, "percentage": 29.67, "elapsed_time": "0:18:33", "remaining_time": "0:43:59", "throughput": 5895.44, "total_tokens": 6566472} {"current_steps": 10070, "total_steps": 33920, "loss": 0.4415, "lr": 8.865378668857972e-06, "epoch": 5.9375, "percentage": 29.69, "elapsed_time": "0:18:34", "remaining_time": "0:43:59", "throughput": 5895.69, "total_tokens": 6570376} {"current_steps": 10075, "total_steps": 33920, "loss": 0.6459, "lr": 8.863746249355404e-06, "epoch": 5.940448113207547, "percentage": 29.7, "elapsed_time": "0:18:34", "remaining_time": "0:43:58", "throughput": 5895.44, "total_tokens": 6572712} {"current_steps": 10080, "total_steps": 33920, "loss": 0.5066, "lr": 8.862112806909365e-06, "epoch": 5.943396226415095, "percentage": 29.72, "elapsed_time": "0:18:35", "remaining_time": "0:43:58", "throughput": 5895.33, "total_tokens": 6575688} {"current_steps": 10085, "total_steps": 33920, "loss": 0.5235, "lr": 8.860478341952314e-06, "epoch": 5.946344339622642, "percentage": 29.73, "elapsed_time": "0:18:35", "remaining_time": "0:43:57", "throughput": 5895.51, "total_tokens": 6578696} {"current_steps": 10090, "total_steps": 33920, "loss": 0.3276, "lr": 8.858842854916985e-06, "epoch": 5.949292452830189, "percentage": 29.75, "elapsed_time": "0:18:36", "remaining_time": "0:43:56", "throughput": 5895.17, "total_tokens": 6581096} {"current_steps": 10095, "total_steps": 33920, "loss": 0.4287, "lr": 8.85720634623638e-06, "epoch": 5.9522405660377355, "percentage": 29.76, "elapsed_time": "0:18:36", "remaining_time": "0:43:55", "throughput": 5895.56, "total_tokens": 6584712} {"current_steps": 10100, "total_steps": 33920, "loss": 0.4793, "lr": 8.855568816343769e-06, "epoch": 5.955188679245283, "percentage": 29.78, "elapsed_time": "0:18:37", "remaining_time": "0:43:55", "throughput": 5895.65, "total_tokens": 6587624} {"current_steps": 10105, "total_steps": 33920, "loss": 0.462, "lr": 8.8539302656727e-06, "epoch": 5.95813679245283, "percentage": 29.79, "elapsed_time": "0:18:37", "remaining_time": "0:43:54", "throughput": 5895.68, "total_tokens": 6590568} {"current_steps": 10110, "total_steps": 33920, "loss": 0.5579, "lr": 8.852290694656983e-06, "epoch": 5.961084905660377, "percentage": 29.81, "elapsed_time": "0:18:38", "remaining_time": "0:43:53", "throughput": 5895.81, "total_tokens": 6593832} {"current_steps": 10115, "total_steps": 33920, "loss": 0.4579, "lr": 8.8506501037307e-06, "epoch": 5.964033018867925, "percentage": 29.82, "elapsed_time": "0:18:38", "remaining_time": "0:43:53", "throughput": 5895.82, "total_tokens": 6596488} {"current_steps": 10120, "total_steps": 33920, "loss": 0.3538, "lr": 8.849008493328209e-06, "epoch": 5.966981132075472, "percentage": 29.83, "elapsed_time": "0:18:39", "remaining_time": "0:43:52", "throughput": 5895.74, "total_tokens": 6599080} {"current_steps": 10125, "total_steps": 33920, "loss": 0.4391, "lr": 8.847365863884131e-06, "epoch": 5.969929245283019, "percentage": 29.85, "elapsed_time": "0:18:39", "remaining_time": "0:43:51", "throughput": 5895.9, "total_tokens": 6602088} {"current_steps": 10130, "total_steps": 33920, "loss": 0.3039, "lr": 8.845722215833359e-06, "epoch": 5.972877358490566, "percentage": 29.86, "elapsed_time": "0:18:40", "remaining_time": "0:43:50", "throughput": 5895.84, "total_tokens": 6604648} {"current_steps": 10135, "total_steps": 33920, "loss": 0.3713, "lr": 8.844077549611056e-06, "epoch": 5.975825471698113, "percentage": 29.88, "elapsed_time": "0:18:40", "remaining_time": "0:43:50", "throughput": 5896.18, "total_tokens": 6608552} {"current_steps": 10140, "total_steps": 33920, "loss": 0.4916, "lr": 8.842431865652654e-06, "epoch": 5.97877358490566, "percentage": 29.89, "elapsed_time": "0:18:41", "remaining_time": "0:43:49", "throughput": 5896.42, "total_tokens": 6612072} {"current_steps": 10145, "total_steps": 33920, "loss": 0.451, "lr": 8.840785164393858e-06, "epoch": 5.9817216981132075, "percentage": 29.91, "elapsed_time": "0:18:41", "remaining_time": "0:43:48", "throughput": 5896.2, "total_tokens": 6614440} {"current_steps": 10150, "total_steps": 33920, "loss": 0.4549, "lr": 8.839137446270634e-06, "epoch": 5.984669811320755, "percentage": 29.92, "elapsed_time": "0:18:42", "remaining_time": "0:43:48", "throughput": 5896.55, "total_tokens": 6618024} {"current_steps": 10155, "total_steps": 33920, "loss": 0.4564, "lr": 8.837488711719226e-06, "epoch": 5.987617924528302, "percentage": 29.94, "elapsed_time": "0:18:42", "remaining_time": "0:43:47", "throughput": 5896.72, "total_tokens": 6621192} {"current_steps": 10160, "total_steps": 33920, "loss": 0.4378, "lr": 8.835838961176143e-06, "epoch": 5.990566037735849, "percentage": 29.95, "elapsed_time": "0:18:43", "remaining_time": "0:43:46", "throughput": 5896.45, "total_tokens": 6623592} {"current_steps": 10165, "total_steps": 33920, "loss": 0.3693, "lr": 8.834188195078164e-06, "epoch": 5.993514150943396, "percentage": 29.97, "elapsed_time": "0:18:43", "remaining_time": "0:43:46", "throughput": 5896.54, "total_tokens": 6626504} {"current_steps": 10170, "total_steps": 33920, "loss": 0.3843, "lr": 8.832536413862337e-06, "epoch": 5.996462264150943, "percentage": 29.98, "elapsed_time": "0:18:44", "remaining_time": "0:43:45", "throughput": 5896.81, "total_tokens": 6629800} {"current_steps": 10175, "total_steps": 33920, "loss": 0.5516, "lr": 8.830883617965976e-06, "epoch": 5.99941037735849, "percentage": 30.0, "elapsed_time": "0:18:44", "remaining_time": "0:43:44", "throughput": 5896.68, "total_tokens": 6632680} {"current_steps": 10176, "total_steps": 33920, "eval_loss": 0.5020108222961426, "epoch": 6.0, "percentage": 30.0, "elapsed_time": "0:19:04", "remaining_time": "0:44:29", "throughput": 5796.75, "total_tokens": 6632800} {"current_steps": 10180, "total_steps": 33920, "loss": 0.3397, "lr": 8.829229807826665e-06, "epoch": 6.002358490566038, "percentage": 30.01, "elapsed_time": "0:19:07", "remaining_time": "0:44:36", "throughput": 5780.31, "total_tokens": 6634976} {"current_steps": 10185, "total_steps": 33920, "loss": 0.3627, "lr": 8.82757498388226e-06, "epoch": 6.005306603773585, "percentage": 30.03, "elapsed_time": "0:19:08", "remaining_time": "0:44:36", "throughput": 5779.88, "total_tokens": 6637536} {"current_steps": 10190, "total_steps": 33920, "loss": 0.3804, "lr": 8.825919146570884e-06, "epoch": 6.008254716981132, "percentage": 30.04, "elapsed_time": "0:19:08", "remaining_time": "0:44:35", "throughput": 5780.24, "total_tokens": 6641152} {"current_steps": 10195, "total_steps": 33920, "loss": 0.4702, "lr": 8.824262296330925e-06, "epoch": 6.0112028301886795, "percentage": 30.06, "elapsed_time": "0:19:09", "remaining_time": "0:44:34", "throughput": 5780.1, "total_tokens": 6644064} {"current_steps": 10200, "total_steps": 33920, "loss": 0.4001, "lr": 8.822604433601041e-06, "epoch": 6.014150943396227, "percentage": 30.07, "elapsed_time": "0:19:10", "remaining_time": "0:44:34", "throughput": 5780.37, "total_tokens": 6647488} {"current_steps": 10205, "total_steps": 33920, "loss": 0.3117, "lr": 8.820945558820158e-06, "epoch": 6.017099056603773, "percentage": 30.09, "elapsed_time": "0:19:10", "remaining_time": "0:44:33", "throughput": 5779.64, "total_tokens": 6649792} {"current_steps": 10210, "total_steps": 33920, "loss": 0.4939, "lr": 8.81928567242747e-06, "epoch": 6.0200471698113205, "percentage": 30.1, "elapsed_time": "0:19:11", "remaining_time": "0:44:33", "throughput": 5778.88, "total_tokens": 6652672} {"current_steps": 10215, "total_steps": 33920, "loss": 0.5602, "lr": 8.817624774862443e-06, "epoch": 6.022995283018868, "percentage": 30.11, "elapsed_time": "0:19:11", "remaining_time": "0:44:32", "throughput": 5778.98, "total_tokens": 6656224} {"current_steps": 10220, "total_steps": 33920, "loss": 0.4647, "lr": 8.815962866564803e-06, "epoch": 6.025943396226415, "percentage": 30.13, "elapsed_time": "0:19:12", "remaining_time": "0:44:32", "throughput": 5779.38, "total_tokens": 6659840} {"current_steps": 10225, "total_steps": 33920, "loss": 0.4868, "lr": 8.814299947974547e-06, "epoch": 6.028891509433962, "percentage": 30.14, "elapsed_time": "0:19:12", "remaining_time": "0:44:31", "throughput": 5779.43, "total_tokens": 6663168} {"current_steps": 10230, "total_steps": 33920, "loss": 0.4054, "lr": 8.812636019531942e-06, "epoch": 6.03183962264151, "percentage": 30.16, "elapsed_time": "0:19:13", "remaining_time": "0:44:31", "throughput": 5779.18, "total_tokens": 6665792} {"current_steps": 10235, "total_steps": 33920, "loss": 0.3985, "lr": 8.810971081677517e-06, "epoch": 6.034787735849057, "percentage": 30.17, "elapsed_time": "0:19:13", "remaining_time": "0:44:30", "throughput": 5779.38, "total_tokens": 6668928} {"current_steps": 10240, "total_steps": 33920, "loss": 0.5117, "lr": 8.809305134852076e-06, "epoch": 6.037735849056604, "percentage": 30.19, "elapsed_time": "0:19:14", "remaining_time": "0:44:29", "throughput": 5779.32, "total_tokens": 6671616} {"current_steps": 10245, "total_steps": 33920, "loss": 0.5803, "lr": 8.807638179496684e-06, "epoch": 6.040683962264151, "percentage": 30.2, "elapsed_time": "0:19:14", "remaining_time": "0:44:28", "throughput": 5779.5, "total_tokens": 6674912} {"current_steps": 10250, "total_steps": 33920, "loss": 0.586, "lr": 8.805970216052673e-06, "epoch": 6.043632075471698, "percentage": 30.22, "elapsed_time": "0:19:15", "remaining_time": "0:44:28", "throughput": 5780.02, "total_tokens": 6679072} {"current_steps": 10255, "total_steps": 33920, "loss": 0.4251, "lr": 8.804301244961645e-06, "epoch": 6.046580188679245, "percentage": 30.23, "elapsed_time": "0:19:16", "remaining_time": "0:44:27", "throughput": 5780.04, "total_tokens": 6681824} {"current_steps": 10260, "total_steps": 33920, "loss": 0.3436, "lr": 8.802631266665465e-06, "epoch": 6.0495283018867925, "percentage": 30.25, "elapsed_time": "0:19:16", "remaining_time": "0:44:27", "throughput": 5780.3, "total_tokens": 6685088} {"current_steps": 10265, "total_steps": 33920, "loss": 0.485, "lr": 8.80096028160627e-06, "epoch": 6.05247641509434, "percentage": 30.26, "elapsed_time": "0:19:17", "remaining_time": "0:44:26", "throughput": 5779.83, "total_tokens": 6687552} {"current_steps": 10270, "total_steps": 33920, "loss": 0.3963, "lr": 8.799288290226457e-06, "epoch": 6.055424528301887, "percentage": 30.28, "elapsed_time": "0:19:17", "remaining_time": "0:44:25", "throughput": 5779.86, "total_tokens": 6690560} {"current_steps": 10275, "total_steps": 33920, "loss": 0.4803, "lr": 8.797615292968698e-06, "epoch": 6.058372641509434, "percentage": 30.29, "elapsed_time": "0:19:18", "remaining_time": "0:44:25", "throughput": 5780.31, "total_tokens": 6694432} {"current_steps": 10280, "total_steps": 33920, "loss": 0.3813, "lr": 8.795941290275923e-06, "epoch": 6.061320754716981, "percentage": 30.31, "elapsed_time": "0:19:18", "remaining_time": "0:44:24", "throughput": 5780.56, "total_tokens": 6697568} {"current_steps": 10285, "total_steps": 33920, "loss": 0.3476, "lr": 8.79426628259133e-06, "epoch": 6.064268867924528, "percentage": 30.32, "elapsed_time": "0:19:19", "remaining_time": "0:44:23", "throughput": 5780.82, "total_tokens": 6701184} {"current_steps": 10290, "total_steps": 33920, "loss": 0.4239, "lr": 8.792590270358389e-06, "epoch": 6.067216981132075, "percentage": 30.34, "elapsed_time": "0:19:19", "remaining_time": "0:44:23", "throughput": 5780.94, "total_tokens": 6704160} {"current_steps": 10295, "total_steps": 33920, "loss": 0.4336, "lr": 8.790913254020827e-06, "epoch": 6.070165094339623, "percentage": 30.35, "elapsed_time": "0:19:20", "remaining_time": "0:44:22", "throughput": 5780.48, "total_tokens": 6706432} {"current_steps": 10300, "total_steps": 33920, "loss": 0.4422, "lr": 8.789235234022643e-06, "epoch": 6.07311320754717, "percentage": 30.37, "elapsed_time": "0:19:20", "remaining_time": "0:44:21", "throughput": 5780.76, "total_tokens": 6709760} {"current_steps": 10305, "total_steps": 33920, "loss": 0.2895, "lr": 8.787556210808101e-06, "epoch": 6.076061320754717, "percentage": 30.38, "elapsed_time": "0:19:21", "remaining_time": "0:44:21", "throughput": 5781.12, "total_tokens": 6713248} {"current_steps": 10310, "total_steps": 33920, "loss": 0.5111, "lr": 8.78587618482173e-06, "epoch": 6.0790094339622645, "percentage": 30.4, "elapsed_time": "0:19:21", "remaining_time": "0:44:20", "throughput": 5781.12, "total_tokens": 6715904} {"current_steps": 10315, "total_steps": 33920, "loss": 0.3387, "lr": 8.78419515650832e-06, "epoch": 6.081957547169812, "percentage": 30.41, "elapsed_time": "0:19:22", "remaining_time": "0:44:20", "throughput": 5781.7, "total_tokens": 6721120} {"current_steps": 10320, "total_steps": 33920, "loss": 0.4124, "lr": 8.782513126312934e-06, "epoch": 6.084905660377358, "percentage": 30.42, "elapsed_time": "0:19:22", "remaining_time": "0:44:19", "throughput": 5781.79, "total_tokens": 6724160} {"current_steps": 10325, "total_steps": 33920, "loss": 0.5492, "lr": 8.780830094680897e-06, "epoch": 6.087853773584905, "percentage": 30.44, "elapsed_time": "0:19:23", "remaining_time": "0:44:19", "throughput": 5782.17, "total_tokens": 6728096} {"current_steps": 10330, "total_steps": 33920, "loss": 0.4293, "lr": 8.779146062057797e-06, "epoch": 6.090801886792453, "percentage": 30.45, "elapsed_time": "0:19:24", "remaining_time": "0:44:18", "throughput": 5782.4, "total_tokens": 6731392} {"current_steps": 10335, "total_steps": 33920, "loss": 0.4462, "lr": 8.777461028889492e-06, "epoch": 6.09375, "percentage": 30.47, "elapsed_time": "0:19:24", "remaining_time": "0:44:18", "throughput": 5783.02, "total_tokens": 6735776} {"current_steps": 10340, "total_steps": 33920, "loss": 0.3952, "lr": 8.775774995622097e-06, "epoch": 6.096698113207547, "percentage": 30.48, "elapsed_time": "0:19:25", "remaining_time": "0:44:17", "throughput": 5783.05, "total_tokens": 6738656} {"current_steps": 10345, "total_steps": 33920, "loss": 0.5506, "lr": 8.774087962702e-06, "epoch": 6.099646226415095, "percentage": 30.5, "elapsed_time": "0:19:25", "remaining_time": "0:44:16", "throughput": 5783.23, "total_tokens": 6741856} {"current_steps": 10350, "total_steps": 33920, "loss": 0.4465, "lr": 8.772399930575849e-06, "epoch": 6.102594339622642, "percentage": 30.51, "elapsed_time": "0:19:26", "remaining_time": "0:44:16", "throughput": 5783.83, "total_tokens": 6746240} {"current_steps": 10355, "total_steps": 33920, "loss": 0.7837, "lr": 8.77071089969056e-06, "epoch": 6.105542452830188, "percentage": 30.53, "elapsed_time": "0:19:26", "remaining_time": "0:44:15", "throughput": 5783.78, "total_tokens": 6749088} {"current_steps": 10360, "total_steps": 33920, "loss": 0.3996, "lr": 8.769020870493309e-06, "epoch": 6.1084905660377355, "percentage": 30.54, "elapsed_time": "0:19:27", "remaining_time": "0:44:14", "throughput": 5783.4, "total_tokens": 6751392} {"current_steps": 10365, "total_steps": 33920, "loss": 0.4884, "lr": 8.767329843431537e-06, "epoch": 6.111438679245283, "percentage": 30.56, "elapsed_time": "0:19:27", "remaining_time": "0:44:14", "throughput": 5783.73, "total_tokens": 6755072} {"current_steps": 10370, "total_steps": 33920, "loss": 0.4144, "lr": 8.765637818952954e-06, "epoch": 6.11438679245283, "percentage": 30.57, "elapsed_time": "0:19:28", "remaining_time": "0:44:13", "throughput": 5783.69, "total_tokens": 6757696} {"current_steps": 10375, "total_steps": 33920, "loss": 0.344, "lr": 8.76394479750553e-06, "epoch": 6.117334905660377, "percentage": 30.59, "elapsed_time": "0:19:28", "remaining_time": "0:44:12", "throughput": 5783.81, "total_tokens": 6760736} {"current_steps": 10380, "total_steps": 33920, "loss": 0.5142, "lr": 8.762250779537499e-06, "epoch": 6.120283018867925, "percentage": 30.6, "elapsed_time": "0:19:29", "remaining_time": "0:44:11", "throughput": 5783.89, "total_tokens": 6763680} {"current_steps": 10385, "total_steps": 33920, "loss": 0.3207, "lr": 8.760555765497358e-06, "epoch": 6.123231132075472, "percentage": 30.62, "elapsed_time": "0:19:29", "remaining_time": "0:44:11", "throughput": 5783.98, "total_tokens": 6766496} {"current_steps": 10390, "total_steps": 33920, "loss": 0.3245, "lr": 8.758859755833873e-06, "epoch": 6.126179245283019, "percentage": 30.63, "elapsed_time": "0:19:30", "remaining_time": "0:44:10", "throughput": 5783.86, "total_tokens": 6769280} {"current_steps": 10395, "total_steps": 33920, "loss": 0.4854, "lr": 8.757162750996066e-06, "epoch": 6.129127358490566, "percentage": 30.65, "elapsed_time": "0:19:30", "remaining_time": "0:44:09", "throughput": 5783.94, "total_tokens": 6772064} {"current_steps": 10400, "total_steps": 33920, "loss": 0.4088, "lr": 8.755464751433229e-06, "epoch": 6.132075471698113, "percentage": 30.66, "elapsed_time": "0:19:31", "remaining_time": "0:44:09", "throughput": 5784.1, "total_tokens": 6775200} {"current_steps": 10405, "total_steps": 33920, "loss": 0.4999, "lr": 8.753765757594915e-06, "epoch": 6.13502358490566, "percentage": 30.68, "elapsed_time": "0:19:31", "remaining_time": "0:44:08", "throughput": 5784.43, "total_tokens": 6778784} {"current_steps": 10410, "total_steps": 33920, "loss": 0.4165, "lr": 8.752065769930938e-06, "epoch": 6.1379716981132075, "percentage": 30.69, "elapsed_time": "0:19:32", "remaining_time": "0:44:07", "throughput": 5784.37, "total_tokens": 6781536} {"current_steps": 10415, "total_steps": 33920, "loss": 0.3385, "lr": 8.75036478889138e-06, "epoch": 6.140919811320755, "percentage": 30.7, "elapsed_time": "0:19:32", "remaining_time": "0:44:06", "throughput": 5784.15, "total_tokens": 6784064} {"current_steps": 10420, "total_steps": 33920, "loss": 0.4212, "lr": 8.748662814926576e-06, "epoch": 6.143867924528302, "percentage": 30.72, "elapsed_time": "0:19:33", "remaining_time": "0:44:06", "throughput": 5784.81, "total_tokens": 6788736} {"current_steps": 10425, "total_steps": 33920, "loss": 0.3795, "lr": 8.746959848487139e-06, "epoch": 6.146816037735849, "percentage": 30.73, "elapsed_time": "0:19:34", "remaining_time": "0:44:06", "throughput": 5785.07, "total_tokens": 6792256} {"current_steps": 10430, "total_steps": 33920, "loss": 0.3895, "lr": 8.745255890023934e-06, "epoch": 6.149764150943396, "percentage": 30.75, "elapsed_time": "0:19:34", "remaining_time": "0:44:05", "throughput": 5785.29, "total_tokens": 6795648} {"current_steps": 10435, "total_steps": 33920, "loss": 0.3765, "lr": 8.74355093998809e-06, "epoch": 6.152712264150943, "percentage": 30.76, "elapsed_time": "0:19:35", "remaining_time": "0:44:04", "throughput": 5785.32, "total_tokens": 6798784} {"current_steps": 10440, "total_steps": 33920, "loss": 0.3448, "lr": 8.741844998831001e-06, "epoch": 6.15566037735849, "percentage": 30.78, "elapsed_time": "0:19:35", "remaining_time": "0:44:04", "throughput": 5785.6, "total_tokens": 6802432} {"current_steps": 10445, "total_steps": 33920, "loss": 0.4029, "lr": 8.740138067004323e-06, "epoch": 6.158608490566038, "percentage": 30.79, "elapsed_time": "0:19:36", "remaining_time": "0:44:03", "throughput": 5785.6, "total_tokens": 6805312} {"current_steps": 10450, "total_steps": 33920, "loss": 0.4001, "lr": 8.738430144959973e-06, "epoch": 6.161556603773585, "percentage": 30.81, "elapsed_time": "0:19:36", "remaining_time": "0:44:02", "throughput": 5785.77, "total_tokens": 6808640} {"current_steps": 10455, "total_steps": 33920, "loss": 0.4271, "lr": 8.73672123315013e-06, "epoch": 6.164504716981132, "percentage": 30.82, "elapsed_time": "0:19:37", "remaining_time": "0:44:02", "throughput": 5785.68, "total_tokens": 6811328} {"current_steps": 10460, "total_steps": 33920, "loss": 0.411, "lr": 8.735011332027234e-06, "epoch": 6.1674528301886795, "percentage": 30.84, "elapsed_time": "0:19:37", "remaining_time": "0:44:01", "throughput": 5785.82, "total_tokens": 6814400} {"current_steps": 10465, "total_steps": 33920, "loss": 0.5188, "lr": 8.733300442043993e-06, "epoch": 6.170400943396227, "percentage": 30.85, "elapsed_time": "0:19:38", "remaining_time": "0:44:00", "throughput": 5785.84, "total_tokens": 6817312} {"current_steps": 10470, "total_steps": 33920, "loss": 0.6431, "lr": 8.73158856365337e-06, "epoch": 6.173349056603773, "percentage": 30.87, "elapsed_time": "0:19:38", "remaining_time": "0:44:00", "throughput": 5785.88, "total_tokens": 6820192} {"current_steps": 10475, "total_steps": 33920, "loss": 0.3565, "lr": 8.729875697308592e-06, "epoch": 6.1762971698113205, "percentage": 30.88, "elapsed_time": "0:19:39", "remaining_time": "0:43:59", "throughput": 5786.02, "total_tokens": 6823264} {"current_steps": 10480, "total_steps": 33920, "loss": 0.4331, "lr": 8.728161843463148e-06, "epoch": 6.179245283018868, "percentage": 30.9, "elapsed_time": "0:19:39", "remaining_time": "0:43:58", "throughput": 5785.85, "total_tokens": 6825888} {"current_steps": 10485, "total_steps": 33920, "loss": 0.6685, "lr": 8.726447002570791e-06, "epoch": 6.182193396226415, "percentage": 30.91, "elapsed_time": "0:19:40", "remaining_time": "0:43:58", "throughput": 5786.21, "total_tokens": 6829760} {"current_steps": 10490, "total_steps": 33920, "loss": 0.4639, "lr": 8.724731175085526e-06, "epoch": 6.185141509433962, "percentage": 30.93, "elapsed_time": "0:19:40", "remaining_time": "0:43:57", "throughput": 5786.18, "total_tokens": 6832416} {"current_steps": 10495, "total_steps": 33920, "loss": 0.3098, "lr": 8.723014361461633e-06, "epoch": 6.18808962264151, "percentage": 30.94, "elapsed_time": "0:19:41", "remaining_time": "0:43:56", "throughput": 5786.51, "total_tokens": 6835776} {"current_steps": 10500, "total_steps": 33920, "loss": 0.406, "lr": 8.72129656215364e-06, "epoch": 6.191037735849057, "percentage": 30.96, "elapsed_time": "0:19:41", "remaining_time": "0:43:56", "throughput": 5786.7, "total_tokens": 6839328} {"current_steps": 10505, "total_steps": 33920, "loss": 0.3585, "lr": 8.719577777616347e-06, "epoch": 6.193985849056604, "percentage": 30.97, "elapsed_time": "0:19:42", "remaining_time": "0:43:55", "throughput": 5786.56, "total_tokens": 6841888} {"current_steps": 10510, "total_steps": 33920, "loss": 0.409, "lr": 8.717858008304804e-06, "epoch": 6.196933962264151, "percentage": 30.98, "elapsed_time": "0:19:42", "remaining_time": "0:43:54", "throughput": 5786.69, "total_tokens": 6845056} {"current_steps": 10515, "total_steps": 33920, "loss": 0.4572, "lr": 8.71613725467433e-06, "epoch": 6.199882075471698, "percentage": 31.0, "elapsed_time": "0:19:43", "remaining_time": "0:43:54", "throughput": 5786.67, "total_tokens": 6847872} {"current_steps": 10520, "total_steps": 33920, "loss": 0.3304, "lr": 8.714415517180506e-06, "epoch": 6.202830188679245, "percentage": 31.01, "elapsed_time": "0:19:43", "remaining_time": "0:43:53", "throughput": 5787.03, "total_tokens": 6851776} {"current_steps": 10525, "total_steps": 33920, "loss": 0.38, "lr": 8.712692796279164e-06, "epoch": 6.2057783018867925, "percentage": 31.03, "elapsed_time": "0:19:44", "remaining_time": "0:43:53", "throughput": 5787.61, "total_tokens": 6856832} {"current_steps": 10530, "total_steps": 33920, "loss": 0.3287, "lr": 8.710969092426401e-06, "epoch": 6.20872641509434, "percentage": 31.04, "elapsed_time": "0:19:45", "remaining_time": "0:43:52", "throughput": 5787.46, "total_tokens": 6859296} {"current_steps": 10535, "total_steps": 33920, "loss": 0.5329, "lr": 8.70924440607858e-06, "epoch": 6.211674528301887, "percentage": 31.06, "elapsed_time": "0:19:45", "remaining_time": "0:43:51", "throughput": 5787.55, "total_tokens": 6862304} {"current_steps": 10540, "total_steps": 33920, "loss": 0.4738, "lr": 8.707518737692315e-06, "epoch": 6.214622641509434, "percentage": 31.07, "elapsed_time": "0:19:46", "remaining_time": "0:43:51", "throughput": 5787.52, "total_tokens": 6865248} {"current_steps": 10545, "total_steps": 33920, "loss": 0.2997, "lr": 8.705792087724485e-06, "epoch": 6.217570754716981, "percentage": 31.09, "elapsed_time": "0:19:46", "remaining_time": "0:43:50", "throughput": 5787.62, "total_tokens": 6868032} {"current_steps": 10550, "total_steps": 33920, "loss": 0.4927, "lr": 8.704064456632231e-06, "epoch": 6.220518867924528, "percentage": 31.1, "elapsed_time": "0:19:47", "remaining_time": "0:43:49", "throughput": 5788.05, "total_tokens": 6871936} {"current_steps": 10555, "total_steps": 33920, "loss": 0.3798, "lr": 8.702335844872946e-06, "epoch": 6.223466981132075, "percentage": 31.12, "elapsed_time": "0:19:47", "remaining_time": "0:43:49", "throughput": 5787.76, "total_tokens": 6874720} {"current_steps": 10560, "total_steps": 33920, "loss": 0.4181, "lr": 8.700606252904293e-06, "epoch": 6.226415094339623, "percentage": 31.13, "elapsed_time": "0:19:48", "remaining_time": "0:43:48", "throughput": 5788.06, "total_tokens": 6877984} {"current_steps": 10565, "total_steps": 33920, "loss": 0.4209, "lr": 8.698875681184183e-06, "epoch": 6.22936320754717, "percentage": 31.15, "elapsed_time": "0:19:48", "remaining_time": "0:43:48", "throughput": 5788.4, "total_tokens": 6881504} {"current_steps": 10570, "total_steps": 33920, "loss": 0.4598, "lr": 8.697144130170797e-06, "epoch": 6.232311320754717, "percentage": 31.16, "elapsed_time": "0:19:49", "remaining_time": "0:43:47", "throughput": 5788.65, "total_tokens": 6884832} {"current_steps": 10575, "total_steps": 33920, "loss": 0.4888, "lr": 8.695411600322568e-06, "epoch": 6.2352594339622645, "percentage": 31.18, "elapsed_time": "0:19:49", "remaining_time": "0:43:46", "throughput": 5788.65, "total_tokens": 6887648} {"current_steps": 10580, "total_steps": 33920, "loss": 0.3685, "lr": 8.693678092098191e-06, "epoch": 6.238207547169812, "percentage": 31.19, "elapsed_time": "0:19:50", "remaining_time": "0:43:45", "throughput": 5788.68, "total_tokens": 6890528} {"current_steps": 10585, "total_steps": 33920, "loss": 0.4171, "lr": 8.691943605956621e-06, "epoch": 6.241155660377358, "percentage": 31.21, "elapsed_time": "0:19:50", "remaining_time": "0:43:45", "throughput": 5788.95, "total_tokens": 6894112} {"current_steps": 10590, "total_steps": 33920, "loss": 0.4101, "lr": 8.690208142357069e-06, "epoch": 6.244103773584905, "percentage": 31.22, "elapsed_time": "0:19:51", "remaining_time": "0:43:44", "throughput": 5789.26, "total_tokens": 6897440} {"current_steps": 10595, "total_steps": 33920, "loss": 0.3522, "lr": 8.68847170175901e-06, "epoch": 6.247051886792453, "percentage": 31.24, "elapsed_time": "0:19:51", "remaining_time": "0:43:44", "throughput": 5789.65, "total_tokens": 6901088} {"current_steps": 10600, "total_steps": 33920, "loss": 0.3493, "lr": 8.686734284622168e-06, "epoch": 6.25, "percentage": 31.25, "elapsed_time": "0:19:52", "remaining_time": "0:43:43", "throughput": 5789.55, "total_tokens": 6903712} {"current_steps": 10605, "total_steps": 33920, "loss": 0.3964, "lr": 8.684995891406537e-06, "epoch": 6.252948113207547, "percentage": 31.26, "elapsed_time": "0:19:52", "remaining_time": "0:43:42", "throughput": 5789.74, "total_tokens": 6906912} {"current_steps": 10610, "total_steps": 33920, "loss": 0.5167, "lr": 8.683256522572362e-06, "epoch": 6.255896226415095, "percentage": 31.28, "elapsed_time": "0:19:53", "remaining_time": "0:43:41", "throughput": 5789.68, "total_tokens": 6909536} {"current_steps": 10615, "total_steps": 33920, "loss": 0.3299, "lr": 8.68151617858015e-06, "epoch": 6.258844339622642, "percentage": 31.29, "elapsed_time": "0:19:53", "remaining_time": "0:43:41", "throughput": 5789.61, "total_tokens": 6912320} {"current_steps": 10620, "total_steps": 33920, "loss": 0.4186, "lr": 8.67977485989066e-06, "epoch": 6.261792452830189, "percentage": 31.31, "elapsed_time": "0:19:54", "remaining_time": "0:43:40", "throughput": 5789.72, "total_tokens": 6915456} {"current_steps": 10625, "total_steps": 33920, "loss": 0.467, "lr": 8.67803256696492e-06, "epoch": 6.2647405660377355, "percentage": 31.32, "elapsed_time": "0:19:55", "remaining_time": "0:43:40", "throughput": 5790.14, "total_tokens": 6919328} {"current_steps": 10630, "total_steps": 33920, "loss": 0.4627, "lr": 8.676289300264205e-06, "epoch": 6.267688679245283, "percentage": 31.34, "elapsed_time": "0:19:55", "remaining_time": "0:43:39", "throughput": 5790.6, "total_tokens": 6923104} {"current_steps": 10635, "total_steps": 33920, "loss": 0.4379, "lr": 8.674545060250054e-06, "epoch": 6.27063679245283, "percentage": 31.35, "elapsed_time": "0:19:56", "remaining_time": "0:43:38", "throughput": 5790.44, "total_tokens": 6926048} {"current_steps": 10640, "total_steps": 33920, "loss": 0.3809, "lr": 8.672799847384263e-06, "epoch": 6.273584905660377, "percentage": 31.37, "elapsed_time": "0:19:56", "remaining_time": "0:43:38", "throughput": 5790.57, "total_tokens": 6929792} {"current_steps": 10645, "total_steps": 33920, "loss": 0.4686, "lr": 8.671053662128883e-06, "epoch": 6.276533018867925, "percentage": 31.38, "elapsed_time": "0:19:57", "remaining_time": "0:43:37", "throughput": 5790.67, "total_tokens": 6932736} {"current_steps": 10650, "total_steps": 33920, "loss": 0.4657, "lr": 8.669306504946223e-06, "epoch": 6.279481132075472, "percentage": 31.4, "elapsed_time": "0:19:57", "remaining_time": "0:43:37", "throughput": 5790.9, "total_tokens": 6936032} {"current_steps": 10655, "total_steps": 33920, "loss": 0.4659, "lr": 8.667558376298854e-06, "epoch": 6.282429245283019, "percentage": 31.41, "elapsed_time": "0:19:58", "remaining_time": "0:43:36", "throughput": 5790.95, "total_tokens": 6939136} {"current_steps": 10660, "total_steps": 33920, "loss": 0.3539, "lr": 8.665809276649597e-06, "epoch": 6.285377358490566, "percentage": 31.43, "elapsed_time": "0:19:58", "remaining_time": "0:43:35", "throughput": 5791.24, "total_tokens": 6942656} {"current_steps": 10665, "total_steps": 33920, "loss": 0.5863, "lr": 8.664059206461537e-06, "epoch": 6.288325471698113, "percentage": 31.44, "elapsed_time": "0:19:59", "remaining_time": "0:43:35", "throughput": 5791.26, "total_tokens": 6945376} {"current_steps": 10670, "total_steps": 33920, "loss": 0.4993, "lr": 8.662308166198009e-06, "epoch": 6.29127358490566, "percentage": 31.46, "elapsed_time": "0:19:59", "remaining_time": "0:43:34", "throughput": 5791.36, "total_tokens": 6948448} {"current_steps": 10675, "total_steps": 33920, "loss": 0.4374, "lr": 8.660556156322611e-06, "epoch": 6.2942216981132075, "percentage": 31.47, "elapsed_time": "0:20:00", "remaining_time": "0:43:33", "throughput": 5791.31, "total_tokens": 6951008} {"current_steps": 10680, "total_steps": 33920, "loss": 0.319, "lr": 8.658803177299196e-06, "epoch": 6.297169811320755, "percentage": 31.49, "elapsed_time": "0:20:00", "remaining_time": "0:43:33", "throughput": 5791.37, "total_tokens": 6954400} {"current_steps": 10685, "total_steps": 33920, "loss": 0.4351, "lr": 8.65704922959187e-06, "epoch": 6.300117924528302, "percentage": 31.5, "elapsed_time": "0:20:01", "remaining_time": "0:43:32", "throughput": 5791.99, "total_tokens": 6959168} {"current_steps": 10690, "total_steps": 33920, "loss": 0.4923, "lr": 8.655294313664998e-06, "epoch": 6.303066037735849, "percentage": 31.52, "elapsed_time": "0:20:02", "remaining_time": "0:43:32", "throughput": 5792.49, "total_tokens": 6963456} {"current_steps": 10695, "total_steps": 33920, "loss": 0.381, "lr": 8.653538429983204e-06, "epoch": 6.306014150943396, "percentage": 31.53, "elapsed_time": "0:20:02", "remaining_time": "0:43:31", "throughput": 5792.91, "total_tokens": 6967232} {"current_steps": 10700, "total_steps": 33920, "loss": 0.3356, "lr": 8.651781579011366e-06, "epoch": 6.308962264150943, "percentage": 31.54, "elapsed_time": "0:20:03", "remaining_time": "0:43:31", "throughput": 5793.01, "total_tokens": 6970336} {"current_steps": 10705, "total_steps": 33920, "loss": 0.474, "lr": 8.650023761214615e-06, "epoch": 6.31191037735849, "percentage": 31.56, "elapsed_time": "0:20:03", "remaining_time": "0:43:30", "throughput": 5792.88, "total_tokens": 6973184} {"current_steps": 10710, "total_steps": 33920, "loss": 0.5343, "lr": 8.648264977058344e-06, "epoch": 6.314858490566038, "percentage": 31.57, "elapsed_time": "0:20:04", "remaining_time": "0:43:29", "throughput": 5793.07, "total_tokens": 6976480} {"current_steps": 10715, "total_steps": 33920, "loss": 0.5249, "lr": 8.646505227008197e-06, "epoch": 6.317806603773585, "percentage": 31.59, "elapsed_time": "0:20:04", "remaining_time": "0:43:29", "throughput": 5793.47, "total_tokens": 6980032} {"current_steps": 10720, "total_steps": 33920, "loss": 0.4217, "lr": 8.644744511530074e-06, "epoch": 6.320754716981132, "percentage": 31.6, "elapsed_time": "0:20:05", "remaining_time": "0:43:28", "throughput": 5793.65, "total_tokens": 6983296} {"current_steps": 10725, "total_steps": 33920, "loss": 0.5654, "lr": 8.642982831090135e-06, "epoch": 6.3237028301886795, "percentage": 31.62, "elapsed_time": "0:20:05", "remaining_time": "0:43:27", "throughput": 5793.98, "total_tokens": 6986784} {"current_steps": 10730, "total_steps": 33920, "loss": 0.5456, "lr": 8.64122018615479e-06, "epoch": 6.326650943396227, "percentage": 31.63, "elapsed_time": "0:20:06", "remaining_time": "0:43:27", "throughput": 5794.61, "total_tokens": 6991648} {"current_steps": 10735, "total_steps": 33920, "loss": 0.3512, "lr": 8.63945657719071e-06, "epoch": 6.329599056603773, "percentage": 31.65, "elapsed_time": "0:20:07", "remaining_time": "0:43:27", "throughput": 5794.77, "total_tokens": 6995104} {"current_steps": 10740, "total_steps": 33920, "loss": 0.3562, "lr": 8.637692004664816e-06, "epoch": 6.3325471698113205, "percentage": 31.66, "elapsed_time": "0:20:07", "remaining_time": "0:43:26", "throughput": 5794.56, "total_tokens": 6997504} {"current_steps": 10745, "total_steps": 33920, "loss": 0.5171, "lr": 8.635926469044284e-06, "epoch": 6.335495283018868, "percentage": 31.68, "elapsed_time": "0:20:08", "remaining_time": "0:43:25", "throughput": 5794.82, "total_tokens": 7001312} {"current_steps": 10750, "total_steps": 33920, "loss": 0.352, "lr": 8.63415997079655e-06, "epoch": 6.338443396226415, "percentage": 31.69, "elapsed_time": "0:20:08", "remaining_time": "0:43:25", "throughput": 5794.7, "total_tokens": 7004032} {"current_steps": 10755, "total_steps": 33920, "loss": 0.436, "lr": 8.6323925103893e-06, "epoch": 6.341391509433962, "percentage": 31.71, "elapsed_time": "0:20:09", "remaining_time": "0:43:24", "throughput": 5794.67, "total_tokens": 7006848} {"current_steps": 10760, "total_steps": 33920, "loss": 0.3455, "lr": 8.63062408829048e-06, "epoch": 6.34433962264151, "percentage": 31.72, "elapsed_time": "0:20:09", "remaining_time": "0:43:23", "throughput": 5794.68, "total_tokens": 7009600} {"current_steps": 10765, "total_steps": 33920, "loss": 0.3871, "lr": 8.628854704968285e-06, "epoch": 6.347287735849057, "percentage": 31.74, "elapsed_time": "0:20:10", "remaining_time": "0:43:22", "throughput": 5794.22, "total_tokens": 7011904} {"current_steps": 10770, "total_steps": 33920, "loss": 0.3823, "lr": 8.62708436089117e-06, "epoch": 6.350235849056604, "percentage": 31.75, "elapsed_time": "0:20:10", "remaining_time": "0:43:22", "throughput": 5794.44, "total_tokens": 7015168} {"current_steps": 10775, "total_steps": 33920, "loss": 0.3832, "lr": 8.625313056527836e-06, "epoch": 6.353183962264151, "percentage": 31.77, "elapsed_time": "0:20:11", "remaining_time": "0:43:21", "throughput": 5794.15, "total_tokens": 7017632} {"current_steps": 10780, "total_steps": 33920, "loss": 0.3014, "lr": 8.623540792347244e-06, "epoch": 6.356132075471698, "percentage": 31.78, "elapsed_time": "0:20:11", "remaining_time": "0:43:21", "throughput": 5794.68, "total_tokens": 7022304} {"current_steps": 10785, "total_steps": 33920, "loss": 0.5369, "lr": 8.621767568818614e-06, "epoch": 6.359080188679245, "percentage": 31.8, "elapsed_time": "0:20:12", "remaining_time": "0:43:20", "throughput": 5794.79, "total_tokens": 7025280} {"current_steps": 10790, "total_steps": 33920, "loss": 0.5328, "lr": 8.619993386411409e-06, "epoch": 6.3620283018867925, "percentage": 31.81, "elapsed_time": "0:20:12", "remaining_time": "0:43:20", "throughput": 5795.14, "total_tokens": 7029216} {"current_steps": 10795, "total_steps": 33920, "loss": 0.4641, "lr": 8.618218245595356e-06, "epoch": 6.36497641509434, "percentage": 31.82, "elapsed_time": "0:20:13", "remaining_time": "0:43:19", "throughput": 5795.21, "total_tokens": 7032192} {"current_steps": 10800, "total_steps": 33920, "loss": 0.477, "lr": 8.616442146840427e-06, "epoch": 6.367924528301887, "percentage": 31.84, "elapsed_time": "0:20:13", "remaining_time": "0:43:18", "throughput": 5795.13, "total_tokens": 7035072} {"current_steps": 10805, "total_steps": 33920, "loss": 0.4155, "lr": 8.614665090616854e-06, "epoch": 6.370872641509434, "percentage": 31.85, "elapsed_time": "0:20:14", "remaining_time": "0:43:18", "throughput": 5795.55, "total_tokens": 7039072} {"current_steps": 10810, "total_steps": 33920, "loss": 0.4178, "lr": 8.61288707739512e-06, "epoch": 6.373820754716981, "percentage": 31.87, "elapsed_time": "0:20:15", "remaining_time": "0:43:17", "throughput": 5796.13, "total_tokens": 7043584} {"current_steps": 10815, "total_steps": 33920, "loss": 0.4746, "lr": 8.611108107645963e-06, "epoch": 6.376768867924528, "percentage": 31.88, "elapsed_time": "0:20:15", "remaining_time": "0:43:17", "throughput": 5796.41, "total_tokens": 7047264} {"current_steps": 10820, "total_steps": 33920, "loss": 0.3146, "lr": 8.609328181840368e-06, "epoch": 6.379716981132075, "percentage": 31.9, "elapsed_time": "0:20:16", "remaining_time": "0:43:16", "throughput": 5796.62, "total_tokens": 7050528} {"current_steps": 10825, "total_steps": 33920, "loss": 0.4013, "lr": 8.607547300449585e-06, "epoch": 6.382665094339623, "percentage": 31.91, "elapsed_time": "0:20:16", "remaining_time": "0:43:16", "throughput": 5796.9, "total_tokens": 7053920} {"current_steps": 10830, "total_steps": 33920, "loss": 0.444, "lr": 8.605765463945105e-06, "epoch": 6.38561320754717, "percentage": 31.93, "elapsed_time": "0:20:17", "remaining_time": "0:43:15", "throughput": 5796.82, "total_tokens": 7056736} {"current_steps": 10835, "total_steps": 33920, "loss": 0.3847, "lr": 8.603982672798678e-06, "epoch": 6.388561320754717, "percentage": 31.94, "elapsed_time": "0:20:17", "remaining_time": "0:43:14", "throughput": 5796.67, "total_tokens": 7059616} {"current_steps": 10840, "total_steps": 33920, "loss": 0.4994, "lr": 8.602198927482309e-06, "epoch": 6.3915094339622645, "percentage": 31.96, "elapsed_time": "0:20:18", "remaining_time": "0:43:14", "throughput": 5797.11, "total_tokens": 7063424} {"current_steps": 10845, "total_steps": 33920, "loss": 0.3366, "lr": 8.600414228468245e-06, "epoch": 6.394457547169811, "percentage": 31.97, "elapsed_time": "0:20:19", "remaining_time": "0:43:13", "throughput": 5797.47, "total_tokens": 7067520} {"current_steps": 10850, "total_steps": 33920, "loss": 0.4935, "lr": 8.598628576229e-06, "epoch": 6.397405660377358, "percentage": 31.99, "elapsed_time": "0:20:19", "remaining_time": "0:43:13", "throughput": 5797.74, "total_tokens": 7070720} {"current_steps": 10855, "total_steps": 33920, "loss": 0.3289, "lr": 8.596841971237328e-06, "epoch": 6.400353773584905, "percentage": 32.0, "elapsed_time": "0:20:20", "remaining_time": "0:43:12", "throughput": 5798.15, "total_tokens": 7074656} {"current_steps": 10860, "total_steps": 33920, "loss": 0.4152, "lr": 8.595054413966246e-06, "epoch": 6.403301886792453, "percentage": 32.02, "elapsed_time": "0:20:20", "remaining_time": "0:43:11", "throughput": 5797.86, "total_tokens": 7077088} {"current_steps": 10865, "total_steps": 33920, "loss": 0.4701, "lr": 8.593265904889011e-06, "epoch": 6.40625, "percentage": 32.03, "elapsed_time": "0:20:21", "remaining_time": "0:43:11", "throughput": 5797.92, "total_tokens": 7080000} {"current_steps": 10870, "total_steps": 33920, "loss": 0.3213, "lr": 8.591476444479141e-06, "epoch": 6.409198113207547, "percentage": 32.05, "elapsed_time": "0:20:21", "remaining_time": "0:43:10", "throughput": 5797.95, "total_tokens": 7083072} {"current_steps": 10875, "total_steps": 33920, "loss": 0.4516, "lr": 8.589686033210407e-06, "epoch": 6.412146226415095, "percentage": 32.06, "elapsed_time": "0:20:22", "remaining_time": "0:43:09", "throughput": 5797.82, "total_tokens": 7085600} {"current_steps": 10880, "total_steps": 33920, "loss": 0.4884, "lr": 8.587894671556823e-06, "epoch": 6.415094339622642, "percentage": 32.08, "elapsed_time": "0:20:22", "remaining_time": "0:43:09", "throughput": 5797.92, "total_tokens": 7088960} {"current_steps": 10885, "total_steps": 33920, "loss": 0.4484, "lr": 8.586102359992663e-06, "epoch": 6.418042452830189, "percentage": 32.09, "elapsed_time": "0:20:23", "remaining_time": "0:43:08", "throughput": 5798.22, "total_tokens": 7092448} {"current_steps": 10890, "total_steps": 33920, "loss": 0.3753, "lr": 8.584309098992447e-06, "epoch": 6.4209905660377355, "percentage": 32.1, "elapsed_time": "0:20:23", "remaining_time": "0:43:07", "throughput": 5797.82, "total_tokens": 7094624} {"current_steps": 10895, "total_steps": 33920, "loss": 0.3845, "lr": 8.58251488903095e-06, "epoch": 6.423938679245283, "percentage": 32.12, "elapsed_time": "0:20:24", "remaining_time": "0:43:07", "throughput": 5797.52, "total_tokens": 7097120} {"current_steps": 10900, "total_steps": 33920, "loss": 0.3401, "lr": 8.580719730583196e-06, "epoch": 6.42688679245283, "percentage": 32.13, "elapsed_time": "0:20:24", "remaining_time": "0:43:06", "throughput": 5797.19, "total_tokens": 7099616} {"current_steps": 10905, "total_steps": 33920, "loss": 0.388, "lr": 8.578923624124462e-06, "epoch": 6.429834905660377, "percentage": 32.15, "elapsed_time": "0:20:25", "remaining_time": "0:43:05", "throughput": 5797.09, "total_tokens": 7102592} {"current_steps": 10910, "total_steps": 33920, "loss": 0.4829, "lr": 8.577126570130273e-06, "epoch": 6.432783018867925, "percentage": 32.16, "elapsed_time": "0:20:25", "remaining_time": "0:43:05", "throughput": 5796.91, "total_tokens": 7105024} {"current_steps": 10915, "total_steps": 33920, "loss": 0.3273, "lr": 8.575328569076408e-06, "epoch": 6.435731132075472, "percentage": 32.18, "elapsed_time": "0:20:26", "remaining_time": "0:43:04", "throughput": 5797.32, "total_tokens": 7109056} {"current_steps": 10920, "total_steps": 33920, "loss": 0.4052, "lr": 8.573529621438896e-06, "epoch": 6.438679245283019, "percentage": 32.19, "elapsed_time": "0:20:26", "remaining_time": "0:43:04", "throughput": 5797.98, "total_tokens": 7114080} {"current_steps": 10925, "total_steps": 33920, "loss": 0.437, "lr": 8.571729727694015e-06, "epoch": 6.441627358490566, "percentage": 32.21, "elapsed_time": "0:20:27", "remaining_time": "0:43:03", "throughput": 5798.43, "total_tokens": 7118016} {"current_steps": 10930, "total_steps": 33920, "loss": 0.4822, "lr": 8.569928888318298e-06, "epoch": 6.444575471698113, "percentage": 32.22, "elapsed_time": "0:20:28", "remaining_time": "0:43:03", "throughput": 5798.16, "total_tokens": 7120288} {"current_steps": 10935, "total_steps": 33920, "loss": 0.5622, "lr": 8.56812710378852e-06, "epoch": 6.44752358490566, "percentage": 32.24, "elapsed_time": "0:20:28", "remaining_time": "0:43:02", "throughput": 5798.21, "total_tokens": 7123200} {"current_steps": 10940, "total_steps": 33920, "loss": 0.3988, "lr": 8.566324374581714e-06, "epoch": 6.4504716981132075, "percentage": 32.25, "elapsed_time": "0:20:29", "remaining_time": "0:43:01", "throughput": 5798.19, "total_tokens": 7126336} {"current_steps": 10945, "total_steps": 33920, "loss": 0.4559, "lr": 8.564520701175158e-06, "epoch": 6.453419811320755, "percentage": 32.27, "elapsed_time": "0:20:29", "remaining_time": "0:43:01", "throughput": 5798.25, "total_tokens": 7129312} {"current_steps": 10950, "total_steps": 33920, "loss": 0.5083, "lr": 8.562716084046387e-06, "epoch": 6.456367924528302, "percentage": 32.28, "elapsed_time": "0:20:30", "remaining_time": "0:43:00", "throughput": 5798.56, "total_tokens": 7133088} {"current_steps": 10955, "total_steps": 33920, "loss": 0.4521, "lr": 8.560910523673177e-06, "epoch": 6.459316037735849, "percentage": 32.3, "elapsed_time": "0:20:30", "remaining_time": "0:43:00", "throughput": 5798.8, "total_tokens": 7137248} {"current_steps": 10960, "total_steps": 33920, "loss": 0.2731, "lr": 8.55910402053356e-06, "epoch": 6.462264150943396, "percentage": 32.31, "elapsed_time": "0:20:31", "remaining_time": "0:42:59", "throughput": 5799.29, "total_tokens": 7141312} {"current_steps": 10965, "total_steps": 33920, "loss": 0.5163, "lr": 8.557296575105814e-06, "epoch": 6.465212264150943, "percentage": 32.33, "elapsed_time": "0:20:32", "remaining_time": "0:42:59", "throughput": 5799.64, "total_tokens": 7145312} {"current_steps": 10970, "total_steps": 33920, "loss": 0.3538, "lr": 8.555488187868469e-06, "epoch": 6.46816037735849, "percentage": 32.34, "elapsed_time": "0:20:32", "remaining_time": "0:42:58", "throughput": 5799.54, "total_tokens": 7147840} {"current_steps": 10975, "total_steps": 33920, "loss": 0.3487, "lr": 8.5536788593003e-06, "epoch": 6.471108490566038, "percentage": 32.36, "elapsed_time": "0:20:33", "remaining_time": "0:42:58", "throughput": 5800.12, "total_tokens": 7152256} {"current_steps": 10980, "total_steps": 33920, "loss": 0.4033, "lr": 8.55186858988034e-06, "epoch": 6.474056603773585, "percentage": 32.37, "elapsed_time": "0:20:33", "remaining_time": "0:42:57", "throughput": 5800.06, "total_tokens": 7154976} {"current_steps": 10985, "total_steps": 33920, "loss": 0.525, "lr": 8.550057380087863e-06, "epoch": 6.477004716981132, "percentage": 32.39, "elapsed_time": "0:20:34", "remaining_time": "0:42:56", "throughput": 5800.2, "total_tokens": 7158112} {"current_steps": 10990, "total_steps": 33920, "loss": 0.4632, "lr": 8.548245230402396e-06, "epoch": 6.4799528301886795, "percentage": 32.4, "elapsed_time": "0:20:34", "remaining_time": "0:42:56", "throughput": 5800.66, "total_tokens": 7162240} {"current_steps": 10995, "total_steps": 33920, "loss": 0.4392, "lr": 8.546432141303711e-06, "epoch": 6.482900943396227, "percentage": 32.41, "elapsed_time": "0:20:35", "remaining_time": "0:42:55", "throughput": 5801.31, "total_tokens": 7166880} {"current_steps": 11000, "total_steps": 33920, "loss": 0.3647, "lr": 8.544618113271833e-06, "epoch": 6.485849056603773, "percentage": 32.43, "elapsed_time": "0:20:35", "remaining_time": "0:42:55", "throughput": 5801.64, "total_tokens": 7170496} {"current_steps": 11005, "total_steps": 33920, "loss": 0.5893, "lr": 8.542803146787032e-06, "epoch": 6.4887971698113205, "percentage": 32.44, "elapsed_time": "0:20:36", "remaining_time": "0:42:54", "throughput": 5802.04, "total_tokens": 7174144} {"current_steps": 11010, "total_steps": 33920, "loss": 0.4448, "lr": 8.54098724232983e-06, "epoch": 6.491745283018868, "percentage": 32.46, "elapsed_time": "0:20:36", "remaining_time": "0:42:53", "throughput": 5802.05, "total_tokens": 7176992} {"current_steps": 11015, "total_steps": 33920, "loss": 0.531, "lr": 8.539170400380994e-06, "epoch": 6.494693396226415, "percentage": 32.47, "elapsed_time": "0:20:37", "remaining_time": "0:42:53", "throughput": 5801.75, "total_tokens": 7179328} {"current_steps": 11020, "total_steps": 33920, "loss": 0.4361, "lr": 8.537352621421542e-06, "epoch": 6.497641509433962, "percentage": 32.49, "elapsed_time": "0:20:37", "remaining_time": "0:42:52", "throughput": 5801.65, "total_tokens": 7181952} {"current_steps": 11025, "total_steps": 33920, "loss": 0.4972, "lr": 8.535533905932739e-06, "epoch": 6.50058962264151, "percentage": 32.5, "elapsed_time": "0:20:38", "remaining_time": "0:42:51", "throughput": 5801.99, "total_tokens": 7185536} {"current_steps": 11030, "total_steps": 33920, "loss": 0.4412, "lr": 8.533714254396096e-06, "epoch": 6.503537735849057, "percentage": 32.52, "elapsed_time": "0:20:38", "remaining_time": "0:42:51", "throughput": 5801.97, "total_tokens": 7188288} {"current_steps": 11035, "total_steps": 33920, "loss": 0.4875, "lr": 8.531893667293375e-06, "epoch": 6.506485849056604, "percentage": 32.53, "elapsed_time": "0:20:39", "remaining_time": "0:42:50", "throughput": 5802.42, "total_tokens": 7192128} {"current_steps": 11040, "total_steps": 33920, "loss": 0.3171, "lr": 8.530072145106585e-06, "epoch": 6.509433962264151, "percentage": 32.55, "elapsed_time": "0:20:39", "remaining_time": "0:42:49", "throughput": 5802.53, "total_tokens": 7195104} {"current_steps": 11045, "total_steps": 33920, "loss": 0.3848, "lr": 8.528249688317978e-06, "epoch": 6.512382075471698, "percentage": 32.56, "elapsed_time": "0:20:40", "remaining_time": "0:42:49", "throughput": 5802.52, "total_tokens": 7197952} {"current_steps": 11050, "total_steps": 33920, "loss": 0.3133, "lr": 8.526426297410062e-06, "epoch": 6.515330188679245, "percentage": 32.58, "elapsed_time": "0:20:41", "remaining_time": "0:42:48", "throughput": 5802.7, "total_tokens": 7201216} {"current_steps": 11055, "total_steps": 33920, "loss": 0.402, "lr": 8.524601972865586e-06, "epoch": 6.5182783018867925, "percentage": 32.59, "elapsed_time": "0:20:41", "remaining_time": "0:42:48", "throughput": 5803.52, "total_tokens": 7207520} {"current_steps": 11060, "total_steps": 33920, "loss": 0.4625, "lr": 8.522776715167548e-06, "epoch": 6.52122641509434, "percentage": 32.61, "elapsed_time": "0:20:42", "remaining_time": "0:42:48", "throughput": 5803.99, "total_tokens": 7211712} {"current_steps": 11065, "total_steps": 33920, "loss": 0.2418, "lr": 8.520950524799192e-06, "epoch": 6.524174528301887, "percentage": 32.62, "elapsed_time": "0:20:43", "remaining_time": "0:42:47", "throughput": 5803.7, "total_tokens": 7214112} {"current_steps": 11070, "total_steps": 33920, "loss": 0.5313, "lr": 8.51912340224401e-06, "epoch": 6.527122641509434, "percentage": 32.64, "elapsed_time": "0:20:43", "remaining_time": "0:42:47", "throughput": 5803.93, "total_tokens": 7219616} {"current_steps": 11075, "total_steps": 33920, "loss": 0.3658, "lr": 8.51729534798574e-06, "epoch": 6.530070754716981, "percentage": 32.65, "elapsed_time": "0:20:44", "remaining_time": "0:42:46", "throughput": 5803.89, "total_tokens": 7222240} {"current_steps": 11080, "total_steps": 33920, "loss": 0.4608, "lr": 8.515466362508369e-06, "epoch": 6.533018867924528, "percentage": 32.67, "elapsed_time": "0:20:44", "remaining_time": "0:42:46", "throughput": 5803.78, "total_tokens": 7224832} {"current_steps": 11085, "total_steps": 33920, "loss": 0.3542, "lr": 8.513636446296125e-06, "epoch": 6.535966981132075, "percentage": 32.68, "elapsed_time": "0:20:45", "remaining_time": "0:42:45", "throughput": 5803.74, "total_tokens": 7227648} {"current_steps": 11090, "total_steps": 33920, "loss": 0.4697, "lr": 8.51180559983349e-06, "epoch": 6.538915094339623, "percentage": 32.69, "elapsed_time": "0:20:45", "remaining_time": "0:42:44", "throughput": 5803.98, "total_tokens": 7231328} {"current_steps": 11095, "total_steps": 33920, "loss": 0.4618, "lr": 8.50997382360519e-06, "epoch": 6.54186320754717, "percentage": 32.71, "elapsed_time": "0:20:46", "remaining_time": "0:42:44", "throughput": 5804.14, "total_tokens": 7234592} {"current_steps": 11100, "total_steps": 33920, "loss": 0.5463, "lr": 8.508141118096191e-06, "epoch": 6.544811320754717, "percentage": 32.72, "elapsed_time": "0:20:46", "remaining_time": "0:42:43", "throughput": 5804.24, "total_tokens": 7237600} {"current_steps": 11105, "total_steps": 33920, "loss": 0.3954, "lr": 8.506307483791712e-06, "epoch": 6.5477594339622645, "percentage": 32.74, "elapsed_time": "0:20:47", "remaining_time": "0:42:42", "throughput": 5804.18, "total_tokens": 7240416} {"current_steps": 11110, "total_steps": 33920, "loss": 0.3508, "lr": 8.504472921177215e-06, "epoch": 6.550707547169811, "percentage": 32.75, "elapsed_time": "0:20:47", "remaining_time": "0:42:42", "throughput": 5803.94, "total_tokens": 7243104} {"current_steps": 11115, "total_steps": 33920, "loss": 0.5178, "lr": 8.502637430738409e-06, "epoch": 6.553655660377358, "percentage": 32.77, "elapsed_time": "0:20:48", "remaining_time": "0:42:41", "throughput": 5804.15, "total_tokens": 7246336} {"current_steps": 11120, "total_steps": 33920, "loss": 0.4293, "lr": 8.500801012961248e-06, "epoch": 6.556603773584905, "percentage": 32.78, "elapsed_time": "0:20:48", "remaining_time": "0:42:40", "throughput": 5804.14, "total_tokens": 7249152} {"current_steps": 11125, "total_steps": 33920, "loss": 0.4648, "lr": 8.49896366833193e-06, "epoch": 6.559551886792453, "percentage": 32.8, "elapsed_time": "0:20:49", "remaining_time": "0:42:40", "throughput": 5804.23, "total_tokens": 7252192} {"current_steps": 11130, "total_steps": 33920, "loss": 0.3835, "lr": 8.497125397336903e-06, "epoch": 6.5625, "percentage": 32.81, "elapsed_time": "0:20:49", "remaining_time": "0:42:39", "throughput": 5804.27, "total_tokens": 7255232} {"current_steps": 11135, "total_steps": 33920, "loss": 0.4251, "lr": 8.495286200462854e-06, "epoch": 6.565448113207547, "percentage": 32.83, "elapsed_time": "0:20:50", "remaining_time": "0:42:38", "throughput": 5804.18, "total_tokens": 7258016} {"current_steps": 11140, "total_steps": 33920, "loss": 0.3453, "lr": 8.49344607819672e-06, "epoch": 6.568396226415095, "percentage": 32.84, "elapsed_time": "0:20:50", "remaining_time": "0:42:38", "throughput": 5803.74, "total_tokens": 7260384} {"current_steps": 11145, "total_steps": 33920, "loss": 0.5215, "lr": 8.49160503102568e-06, "epoch": 6.571344339622642, "percentage": 32.86, "elapsed_time": "0:20:51", "remaining_time": "0:42:37", "throughput": 5803.75, "total_tokens": 7263264} {"current_steps": 11150, "total_steps": 33920, "loss": 0.4045, "lr": 8.489763059437161e-06, "epoch": 6.574292452830189, "percentage": 32.87, "elapsed_time": "0:20:51", "remaining_time": "0:42:36", "throughput": 5803.89, "total_tokens": 7266464} {"current_steps": 11155, "total_steps": 33920, "loss": 0.3774, "lr": 8.487920163918833e-06, "epoch": 6.5772405660377355, "percentage": 32.89, "elapsed_time": "0:20:52", "remaining_time": "0:42:36", "throughput": 5803.68, "total_tokens": 7269472} {"current_steps": 11160, "total_steps": 33920, "loss": 0.4179, "lr": 8.486076344958607e-06, "epoch": 6.580188679245283, "percentage": 32.9, "elapsed_time": "0:20:53", "remaining_time": "0:42:35", "throughput": 5804.19, "total_tokens": 7273632} {"current_steps": 11165, "total_steps": 33920, "loss": 0.4313, "lr": 8.484231603044647e-06, "epoch": 6.58313679245283, "percentage": 32.92, "elapsed_time": "0:20:53", "remaining_time": "0:42:35", "throughput": 5804.47, "total_tokens": 7277344} {"current_steps": 11170, "total_steps": 33920, "loss": 0.283, "lr": 8.482385938665352e-06, "epoch": 6.586084905660377, "percentage": 32.93, "elapsed_time": "0:20:54", "remaining_time": "0:42:34", "throughput": 5804.45, "total_tokens": 7280128} {"current_steps": 11175, "total_steps": 33920, "loss": 0.4056, "lr": 8.480539352309373e-06, "epoch": 6.589033018867925, "percentage": 32.95, "elapsed_time": "0:20:54", "remaining_time": "0:42:33", "throughput": 5804.57, "total_tokens": 7283648} {"current_steps": 11180, "total_steps": 33920, "loss": 0.4323, "lr": 8.478691844465598e-06, "epoch": 6.591981132075472, "percentage": 32.96, "elapsed_time": "0:20:55", "remaining_time": "0:42:33", "throughput": 5804.47, "total_tokens": 7286272} {"current_steps": 11185, "total_steps": 33920, "loss": 0.3752, "lr": 8.476843415623168e-06, "epoch": 6.594929245283019, "percentage": 32.97, "elapsed_time": "0:20:55", "remaining_time": "0:42:32", "throughput": 5804.62, "total_tokens": 7289568} {"current_steps": 11190, "total_steps": 33920, "loss": 0.5469, "lr": 8.474994066271458e-06, "epoch": 6.597877358490566, "percentage": 32.99, "elapsed_time": "0:20:56", "remaining_time": "0:42:32", "throughput": 5804.96, "total_tokens": 7293696} {"current_steps": 11195, "total_steps": 33920, "loss": 0.5029, "lr": 8.473143796900089e-06, "epoch": 6.600825471698113, "percentage": 33.0, "elapsed_time": "0:20:56", "remaining_time": "0:42:31", "throughput": 5804.58, "total_tokens": 7296160} {"current_steps": 11200, "total_steps": 33920, "loss": 0.5805, "lr": 8.471292607998936e-06, "epoch": 6.60377358490566, "percentage": 33.02, "elapsed_time": "0:20:57", "remaining_time": "0:42:31", "throughput": 5804.94, "total_tokens": 7299936} {"current_steps": 11205, "total_steps": 33920, "loss": 0.4418, "lr": 8.469440500058104e-06, "epoch": 6.6067216981132075, "percentage": 33.03, "elapsed_time": "0:20:58", "remaining_time": "0:42:30", "throughput": 5805.82, "total_tokens": 7305664} {"current_steps": 11210, "total_steps": 33920, "loss": 0.6698, "lr": 8.467587473567945e-06, "epoch": 6.609669811320755, "percentage": 33.05, "elapsed_time": "0:20:58", "remaining_time": "0:42:30", "throughput": 5806.09, "total_tokens": 7309472} {"current_steps": 11215, "total_steps": 33920, "loss": 0.342, "lr": 8.46573352901906e-06, "epoch": 6.612617924528302, "percentage": 33.06, "elapsed_time": "0:20:59", "remaining_time": "0:42:29", "throughput": 5806.45, "total_tokens": 7313152} {"current_steps": 11220, "total_steps": 33920, "loss": 0.4557, "lr": 8.463878666902286e-06, "epoch": 6.615566037735849, "percentage": 33.08, "elapsed_time": "0:21:00", "remaining_time": "0:42:29", "throughput": 5807.09, "total_tokens": 7318112} {"current_steps": 11225, "total_steps": 33920, "loss": 0.3286, "lr": 8.462022887708706e-06, "epoch": 6.618514150943396, "percentage": 33.09, "elapsed_time": "0:21:00", "remaining_time": "0:42:28", "throughput": 5806.9, "total_tokens": 7320800} {"current_steps": 11230, "total_steps": 33920, "loss": 0.4098, "lr": 8.460166191929646e-06, "epoch": 6.621462264150943, "percentage": 33.11, "elapsed_time": "0:21:01", "remaining_time": "0:42:28", "throughput": 5807.23, "total_tokens": 7324736} {"current_steps": 11235, "total_steps": 33920, "loss": 0.4455, "lr": 8.458308580056675e-06, "epoch": 6.62441037735849, "percentage": 33.12, "elapsed_time": "0:21:01", "remaining_time": "0:42:27", "throughput": 5807.51, "total_tokens": 7328352} {"current_steps": 11240, "total_steps": 33920, "loss": 0.4135, "lr": 8.456450052581602e-06, "epoch": 6.627358490566038, "percentage": 33.14, "elapsed_time": "0:21:02", "remaining_time": "0:42:27", "throughput": 5807.9, "total_tokens": 7332064} {"current_steps": 11245, "total_steps": 33920, "loss": 0.5028, "lr": 8.45459060999648e-06, "epoch": 6.630306603773585, "percentage": 33.15, "elapsed_time": "0:21:03", "remaining_time": "0:42:26", "throughput": 5808.2, "total_tokens": 7336224} {"current_steps": 11250, "total_steps": 33920, "loss": 0.5647, "lr": 8.452730252793608e-06, "epoch": 6.633254716981132, "percentage": 33.17, "elapsed_time": "0:21:03", "remaining_time": "0:42:26", "throughput": 5808.36, "total_tokens": 7339424} {"current_steps": 11255, "total_steps": 33920, "loss": 0.3141, "lr": 8.450868981465519e-06, "epoch": 6.6362028301886795, "percentage": 33.18, "elapsed_time": "0:21:04", "remaining_time": "0:42:25", "throughput": 5808.53, "total_tokens": 7342912} {"current_steps": 11260, "total_steps": 33920, "loss": 0.3394, "lr": 8.449006796504997e-06, "epoch": 6.639150943396227, "percentage": 33.2, "elapsed_time": "0:21:04", "remaining_time": "0:42:24", "throughput": 5808.2, "total_tokens": 7345216} {"current_steps": 11265, "total_steps": 33920, "loss": 0.4621, "lr": 8.44714369840506e-06, "epoch": 6.642099056603773, "percentage": 33.21, "elapsed_time": "0:21:05", "remaining_time": "0:42:24", "throughput": 5808.47, "total_tokens": 7348736} {"current_steps": 11270, "total_steps": 33920, "loss": 0.3726, "lr": 8.445279687658973e-06, "epoch": 6.6450471698113205, "percentage": 33.23, "elapsed_time": "0:21:05", "remaining_time": "0:42:23", "throughput": 5808.44, "total_tokens": 7351616} {"current_steps": 11275, "total_steps": 33920, "loss": 0.3986, "lr": 8.44341476476024e-06, "epoch": 6.647995283018868, "percentage": 33.24, "elapsed_time": "0:21:06", "remaining_time": "0:42:24", "throughput": 5809.06, "total_tokens": 7359168} {"current_steps": 11280, "total_steps": 33920, "loss": 0.403, "lr": 8.441548930202608e-06, "epoch": 6.650943396226415, "percentage": 33.25, "elapsed_time": "0:21:07", "remaining_time": "0:42:23", "throughput": 5808.99, "total_tokens": 7361984} {"current_steps": 11285, "total_steps": 33920, "loss": 0.4786, "lr": 8.439682184480065e-06, "epoch": 6.653891509433962, "percentage": 33.27, "elapsed_time": "0:21:07", "remaining_time": "0:42:23", "throughput": 5809.03, "total_tokens": 7365216} {"current_steps": 11290, "total_steps": 33920, "loss": 0.5055, "lr": 8.437814528086837e-06, "epoch": 6.65683962264151, "percentage": 33.28, "elapsed_time": "0:21:08", "remaining_time": "0:42:22", "throughput": 5809.25, "total_tokens": 7368512} {"current_steps": 11295, "total_steps": 33920, "loss": 0.4474, "lr": 8.435945961517398e-06, "epoch": 6.659787735849057, "percentage": 33.3, "elapsed_time": "0:21:08", "remaining_time": "0:42:21", "throughput": 5808.93, "total_tokens": 7371040} {"current_steps": 11300, "total_steps": 33920, "loss": 0.4074, "lr": 8.434076485266458e-06, "epoch": 6.662735849056604, "percentage": 33.31, "elapsed_time": "0:21:09", "remaining_time": "0:42:21", "throughput": 5809.09, "total_tokens": 7374496} {"current_steps": 11305, "total_steps": 33920, "loss": 0.5354, "lr": 8.432206099828969e-06, "epoch": 6.665683962264151, "percentage": 33.33, "elapsed_time": "0:21:10", "remaining_time": "0:42:20", "throughput": 5809.39, "total_tokens": 7378112} {"current_steps": 11310, "total_steps": 33920, "loss": 0.3799, "lr": 8.430334805700122e-06, "epoch": 6.668632075471698, "percentage": 33.34, "elapsed_time": "0:21:10", "remaining_time": "0:42:20", "throughput": 5809.75, "total_tokens": 7381792} {"current_steps": 11315, "total_steps": 33920, "loss": 0.5497, "lr": 8.428462603375351e-06, "epoch": 6.671580188679245, "percentage": 33.36, "elapsed_time": "0:21:11", "remaining_time": "0:42:19", "throughput": 5809.61, "total_tokens": 7384384} {"current_steps": 11320, "total_steps": 33920, "loss": 0.5424, "lr": 8.426589493350332e-06, "epoch": 6.6745283018867925, "percentage": 33.37, "elapsed_time": "0:21:11", "remaining_time": "0:42:18", "throughput": 5809.86, "total_tokens": 7388032} {"current_steps": 11325, "total_steps": 33920, "loss": 0.6295, "lr": 8.424715476120976e-06, "epoch": 6.67747641509434, "percentage": 33.39, "elapsed_time": "0:21:12", "remaining_time": "0:42:18", "throughput": 5809.95, "total_tokens": 7391136} {"current_steps": 11330, "total_steps": 33920, "loss": 0.5037, "lr": 8.422840552183437e-06, "epoch": 6.680424528301887, "percentage": 33.4, "elapsed_time": "0:21:12", "remaining_time": "0:42:17", "throughput": 5810.02, "total_tokens": 7394560} {"current_steps": 11335, "total_steps": 33920, "loss": 0.3815, "lr": 8.420964722034111e-06, "epoch": 6.683372641509434, "percentage": 33.42, "elapsed_time": "0:21:13", "remaining_time": "0:42:17", "throughput": 5810.3, "total_tokens": 7398208} {"current_steps": 11340, "total_steps": 33920, "loss": 0.4193, "lr": 8.41908798616963e-06, "epoch": 6.686320754716981, "percentage": 33.43, "elapsed_time": "0:21:13", "remaining_time": "0:42:16", "throughput": 5810.49, "total_tokens": 7401600} {"current_steps": 11345, "total_steps": 33920, "loss": 0.3391, "lr": 8.41721034508687e-06, "epoch": 6.689268867924528, "percentage": 33.45, "elapsed_time": "0:21:14", "remaining_time": "0:42:16", "throughput": 5810.53, "total_tokens": 7405504} {"current_steps": 11350, "total_steps": 33920, "loss": 0.3748, "lr": 8.415331799282942e-06, "epoch": 6.692216981132075, "percentage": 33.46, "elapsed_time": "0:21:14", "remaining_time": "0:42:15", "throughput": 5810.42, "total_tokens": 7408192} {"current_steps": 11355, "total_steps": 33920, "loss": 0.4104, "lr": 8.413452349255205e-06, "epoch": 6.695165094339623, "percentage": 33.48, "elapsed_time": "0:21:15", "remaining_time": "0:42:14", "throughput": 5809.93, "total_tokens": 7410752} {"current_steps": 11360, "total_steps": 33920, "loss": 0.4477, "lr": 8.411571995501245e-06, "epoch": 6.69811320754717, "percentage": 33.49, "elapsed_time": "0:21:15", "remaining_time": "0:42:14", "throughput": 5809.88, "total_tokens": 7413376} {"current_steps": 11365, "total_steps": 33920, "loss": 0.5333, "lr": 8.409690738518895e-06, "epoch": 6.701061320754717, "percentage": 33.51, "elapsed_time": "0:21:16", "remaining_time": "0:42:13", "throughput": 5810.23, "total_tokens": 7417344} {"current_steps": 11370, "total_steps": 33920, "loss": 0.3967, "lr": 8.407808578806229e-06, "epoch": 6.7040094339622645, "percentage": 33.52, "elapsed_time": "0:21:17", "remaining_time": "0:42:12", "throughput": 5810.34, "total_tokens": 7420608} {"current_steps": 11375, "total_steps": 33920, "loss": 0.3422, "lr": 8.405925516861555e-06, "epoch": 6.706957547169811, "percentage": 33.53, "elapsed_time": "0:21:17", "remaining_time": "0:42:12", "throughput": 5810.51, "total_tokens": 7423840} {"current_steps": 11380, "total_steps": 33920, "loss": 0.4422, "lr": 8.40404155318342e-06, "epoch": 6.709905660377358, "percentage": 33.55, "elapsed_time": "0:21:18", "remaining_time": "0:42:11", "throughput": 5810.97, "total_tokens": 7427840} {"current_steps": 11385, "total_steps": 33920, "loss": 0.5032, "lr": 8.402156688270613e-06, "epoch": 6.712853773584905, "percentage": 33.56, "elapsed_time": "0:21:18", "remaining_time": "0:42:11", "throughput": 5811.07, "total_tokens": 7431328} {"current_steps": 11390, "total_steps": 33920, "loss": 0.4468, "lr": 8.400270922622162e-06, "epoch": 6.715801886792453, "percentage": 33.58, "elapsed_time": "0:21:19", "remaining_time": "0:42:10", "throughput": 5811.52, "total_tokens": 7435296} {"current_steps": 11395, "total_steps": 33920, "loss": 0.4916, "lr": 8.398384256737328e-06, "epoch": 6.71875, "percentage": 33.59, "elapsed_time": "0:21:19", "remaining_time": "0:42:10", "throughput": 5811.45, "total_tokens": 7438048} {"current_steps": 11400, "total_steps": 33920, "loss": 0.6071, "lr": 8.396496691115619e-06, "epoch": 6.721698113207547, "percentage": 33.61, "elapsed_time": "0:21:20", "remaining_time": "0:42:09", "throughput": 5811.48, "total_tokens": 7441088} {"current_steps": 11405, "total_steps": 33920, "loss": 0.4441, "lr": 8.39460822625677e-06, "epoch": 6.724646226415095, "percentage": 33.62, "elapsed_time": "0:21:20", "remaining_time": "0:42:08", "throughput": 5811.14, "total_tokens": 7443360} {"current_steps": 11410, "total_steps": 33920, "loss": 0.3033, "lr": 8.392718862660765e-06, "epoch": 6.727594339622642, "percentage": 33.64, "elapsed_time": "0:21:21", "remaining_time": "0:42:08", "throughput": 5811.67, "total_tokens": 7447616} {"current_steps": 11415, "total_steps": 33920, "loss": 0.4327, "lr": 8.390828600827818e-06, "epoch": 6.730542452830189, "percentage": 33.65, "elapsed_time": "0:21:21", "remaining_time": "0:42:07", "throughput": 5811.6, "total_tokens": 7450240} {"current_steps": 11420, "total_steps": 33920, "loss": 0.516, "lr": 8.388937441258385e-06, "epoch": 6.7334905660377355, "percentage": 33.67, "elapsed_time": "0:21:22", "remaining_time": "0:42:06", "throughput": 5811.76, "total_tokens": 7453664} {"current_steps": 11425, "total_steps": 33920, "loss": 0.4303, "lr": 8.387045384453162e-06, "epoch": 6.736438679245283, "percentage": 33.68, "elapsed_time": "0:21:23", "remaining_time": "0:42:06", "throughput": 5811.91, "total_tokens": 7456800} {"current_steps": 11430, "total_steps": 33920, "loss": 0.4387, "lr": 8.385152430913073e-06, "epoch": 6.73938679245283, "percentage": 33.7, "elapsed_time": "0:21:23", "remaining_time": "0:42:05", "throughput": 5811.88, "total_tokens": 7459648} {"current_steps": 11435, "total_steps": 33920, "loss": 0.4903, "lr": 8.383258581139288e-06, "epoch": 6.742334905660377, "percentage": 33.71, "elapsed_time": "0:21:24", "remaining_time": "0:42:04", "throughput": 5812.21, "total_tokens": 7463424} {"current_steps": 11440, "total_steps": 33920, "loss": 0.451, "lr": 8.381363835633213e-06, "epoch": 6.745283018867925, "percentage": 33.73, "elapsed_time": "0:21:24", "remaining_time": "0:42:04", "throughput": 5812.07, "total_tokens": 7466144} {"current_steps": 11445, "total_steps": 33920, "loss": 0.4346, "lr": 8.379468194896492e-06, "epoch": 6.748231132075472, "percentage": 33.74, "elapsed_time": "0:21:25", "remaining_time": "0:42:03", "throughput": 5812.09, "total_tokens": 7468992} {"current_steps": 11450, "total_steps": 33920, "loss": 0.5312, "lr": 8.377571659431e-06, "epoch": 6.751179245283019, "percentage": 33.76, "elapsed_time": "0:21:25", "remaining_time": "0:42:02", "throughput": 5812.32, "total_tokens": 7472288} {"current_steps": 11455, "total_steps": 33920, "loss": 0.4775, "lr": 8.375674229738855e-06, "epoch": 6.754127358490566, "percentage": 33.77, "elapsed_time": "0:21:26", "remaining_time": "0:42:02", "throughput": 5812.54, "total_tokens": 7475648} {"current_steps": 11460, "total_steps": 33920, "loss": 0.5368, "lr": 8.37377590632241e-06, "epoch": 6.757075471698113, "percentage": 33.79, "elapsed_time": "0:21:26", "remaining_time": "0:42:01", "throughput": 5812.69, "total_tokens": 7479712} {"current_steps": 11465, "total_steps": 33920, "loss": 0.454, "lr": 8.371876689684253e-06, "epoch": 6.76002358490566, "percentage": 33.8, "elapsed_time": "0:21:27", "remaining_time": "0:42:01", "throughput": 5812.75, "total_tokens": 7482688} {"current_steps": 11470, "total_steps": 33920, "loss": 0.3797, "lr": 8.369976580327211e-06, "epoch": 6.7629716981132075, "percentage": 33.81, "elapsed_time": "0:21:27", "remaining_time": "0:42:00", "throughput": 5813.03, "total_tokens": 7486176} {"current_steps": 11475, "total_steps": 33920, "loss": 0.4165, "lr": 8.368075578754345e-06, "epoch": 6.765919811320755, "percentage": 33.83, "elapsed_time": "0:21:28", "remaining_time": "0:41:59", "throughput": 5812.67, "total_tokens": 7488384} {"current_steps": 11480, "total_steps": 33920, "loss": 0.4835, "lr": 8.366173685468952e-06, "epoch": 6.768867924528302, "percentage": 33.84, "elapsed_time": "0:21:28", "remaining_time": "0:41:59", "throughput": 5812.87, "total_tokens": 7491680} {"current_steps": 11485, "total_steps": 33920, "loss": 0.3695, "lr": 8.364270900974572e-06, "epoch": 6.771816037735849, "percentage": 33.86, "elapsed_time": "0:21:29", "remaining_time": "0:41:58", "throughput": 5812.92, "total_tokens": 7494592} {"current_steps": 11490, "total_steps": 33920, "loss": 0.4804, "lr": 8.362367225774968e-06, "epoch": 6.774764150943396, "percentage": 33.87, "elapsed_time": "0:21:29", "remaining_time": "0:41:57", "throughput": 5813.04, "total_tokens": 7497632} {"current_steps": 11495, "total_steps": 33920, "loss": 0.4748, "lr": 8.360462660374153e-06, "epoch": 6.777712264150943, "percentage": 33.89, "elapsed_time": "0:21:30", "remaining_time": "0:41:57", "throughput": 5812.83, "total_tokens": 7500096} {"current_steps": 11500, "total_steps": 33920, "loss": 0.4511, "lr": 8.358557205276365e-06, "epoch": 6.78066037735849, "percentage": 33.9, "elapsed_time": "0:21:30", "remaining_time": "0:41:56", "throughput": 5812.98, "total_tokens": 7503392} {"current_steps": 11505, "total_steps": 33920, "loss": 0.3506, "lr": 8.356650860986083e-06, "epoch": 6.783608490566038, "percentage": 33.92, "elapsed_time": "0:21:31", "remaining_time": "0:41:55", "throughput": 5812.98, "total_tokens": 7506304} {"current_steps": 11510, "total_steps": 33920, "loss": 0.4215, "lr": 8.354743628008017e-06, "epoch": 6.786556603773585, "percentage": 33.93, "elapsed_time": "0:21:31", "remaining_time": "0:41:55", "throughput": 5813.11, "total_tokens": 7509376} {"current_steps": 11515, "total_steps": 33920, "loss": 0.547, "lr": 8.35283550684712e-06, "epoch": 6.789504716981132, "percentage": 33.95, "elapsed_time": "0:21:32", "remaining_time": "0:41:54", "throughput": 5813.13, "total_tokens": 7512480} {"current_steps": 11520, "total_steps": 33920, "loss": 0.586, "lr": 8.350926498008572e-06, "epoch": 6.7924528301886795, "percentage": 33.96, "elapsed_time": "0:21:32", "remaining_time": "0:41:53", "throughput": 5813.09, "total_tokens": 7515552} {"current_steps": 11525, "total_steps": 33920, "loss": 0.3822, "lr": 8.34901660199779e-06, "epoch": 6.795400943396227, "percentage": 33.98, "elapsed_time": "0:21:33", "remaining_time": "0:41:53", "throughput": 5813.14, "total_tokens": 7518656} {"current_steps": 11530, "total_steps": 33920, "loss": 0.4835, "lr": 8.347105819320432e-06, "epoch": 6.798349056603773, "percentage": 33.99, "elapsed_time": "0:21:33", "remaining_time": "0:41:52", "throughput": 5813.26, "total_tokens": 7521952} {"current_steps": 11535, "total_steps": 33920, "loss": 0.395, "lr": 8.34519415048238e-06, "epoch": 6.8012971698113205, "percentage": 34.01, "elapsed_time": "0:21:34", "remaining_time": "0:41:52", "throughput": 5813.43, "total_tokens": 7525376} {"current_steps": 11540, "total_steps": 33920, "loss": 0.3832, "lr": 8.343281595989761e-06, "epoch": 6.804245283018868, "percentage": 34.02, "elapsed_time": "0:21:34", "remaining_time": "0:41:51", "throughput": 5813.31, "total_tokens": 7528128} {"current_steps": 11545, "total_steps": 33920, "loss": 0.4204, "lr": 8.341368156348933e-06, "epoch": 6.807193396226415, "percentage": 34.04, "elapsed_time": "0:21:35", "remaining_time": "0:41:50", "throughput": 5813.43, "total_tokens": 7531328} {"current_steps": 11550, "total_steps": 33920, "loss": 0.4761, "lr": 8.339453832066482e-06, "epoch": 6.810141509433962, "percentage": 34.05, "elapsed_time": "0:21:35", "remaining_time": "0:41:50", "throughput": 5813.21, "total_tokens": 7533792} {"current_steps": 11555, "total_steps": 33920, "loss": 0.3677, "lr": 8.337538623649237e-06, "epoch": 6.81308962264151, "percentage": 34.07, "elapsed_time": "0:21:36", "remaining_time": "0:41:49", "throughput": 5813.34, "total_tokens": 7537216} {"current_steps": 11560, "total_steps": 33920, "loss": 0.5086, "lr": 8.33562253160426e-06, "epoch": 6.816037735849057, "percentage": 34.08, "elapsed_time": "0:21:37", "remaining_time": "0:41:48", "throughput": 5813.04, "total_tokens": 7539712} {"current_steps": 11565, "total_steps": 33920, "loss": 0.5623, "lr": 8.33370555643884e-06, "epoch": 6.818985849056604, "percentage": 34.09, "elapsed_time": "0:21:37", "remaining_time": "0:41:48", "throughput": 5813.15, "total_tokens": 7542848} {"current_steps": 11570, "total_steps": 33920, "loss": 0.3821, "lr": 8.331787698660507e-06, "epoch": 6.821933962264151, "percentage": 34.11, "elapsed_time": "0:21:38", "remaining_time": "0:41:47", "throughput": 5813.2, "total_tokens": 7545888} {"current_steps": 11575, "total_steps": 33920, "loss": 0.5281, "lr": 8.32986895877702e-06, "epoch": 6.824882075471698, "percentage": 34.12, "elapsed_time": "0:21:38", "remaining_time": "0:41:46", "throughput": 5813.27, "total_tokens": 7548864} {"current_steps": 11580, "total_steps": 33920, "loss": 0.3915, "lr": 8.327949337296378e-06, "epoch": 6.827830188679245, "percentage": 34.14, "elapsed_time": "0:21:39", "remaining_time": "0:41:46", "throughput": 5813.02, "total_tokens": 7551232} {"current_steps": 11585, "total_steps": 33920, "loss": 0.4711, "lr": 8.326028834726803e-06, "epoch": 6.8307783018867925, "percentage": 34.15, "elapsed_time": "0:21:39", "remaining_time": "0:41:45", "throughput": 5813.34, "total_tokens": 7555040} {"current_steps": 11590, "total_steps": 33920, "loss": 0.4952, "lr": 8.324107451576762e-06, "epoch": 6.83372641509434, "percentage": 34.17, "elapsed_time": "0:21:40", "remaining_time": "0:41:44", "throughput": 5813.06, "total_tokens": 7557664} {"current_steps": 11595, "total_steps": 33920, "loss": 0.4391, "lr": 8.322185188354947e-06, "epoch": 6.836674528301887, "percentage": 34.18, "elapsed_time": "0:21:40", "remaining_time": "0:41:44", "throughput": 5813.48, "total_tokens": 7561856} {"current_steps": 11600, "total_steps": 33920, "loss": 0.3429, "lr": 8.320262045570284e-06, "epoch": 6.839622641509434, "percentage": 34.2, "elapsed_time": "0:21:41", "remaining_time": "0:41:43", "throughput": 5813.7, "total_tokens": 7565248} {"current_steps": 11605, "total_steps": 33920, "loss": 0.3578, "lr": 8.318338023731937e-06, "epoch": 6.842570754716981, "percentage": 34.21, "elapsed_time": "0:21:41", "remaining_time": "0:41:43", "throughput": 5814.14, "total_tokens": 7569536} {"current_steps": 11610, "total_steps": 33920, "loss": 0.415, "lr": 8.316413123349296e-06, "epoch": 6.845518867924528, "percentage": 34.23, "elapsed_time": "0:21:42", "remaining_time": "0:41:42", "throughput": 5814.11, "total_tokens": 7572288} {"current_steps": 11615, "total_steps": 33920, "loss": 0.4335, "lr": 8.314487344931987e-06, "epoch": 6.848466981132075, "percentage": 34.24, "elapsed_time": "0:21:42", "remaining_time": "0:41:42", "throughput": 5814.28, "total_tokens": 7575520} {"current_steps": 11620, "total_steps": 33920, "loss": 0.4561, "lr": 8.31256068898987e-06, "epoch": 6.851415094339623, "percentage": 34.26, "elapsed_time": "0:21:43", "remaining_time": "0:41:41", "throughput": 5814.62, "total_tokens": 7579264} {"current_steps": 11625, "total_steps": 33920, "loss": 0.3629, "lr": 8.310633156033032e-06, "epoch": 6.85436320754717, "percentage": 34.27, "elapsed_time": "0:21:44", "remaining_time": "0:41:40", "throughput": 5814.74, "total_tokens": 7582496} {"current_steps": 11630, "total_steps": 33920, "loss": 0.4917, "lr": 8.3087047465718e-06, "epoch": 6.857311320754717, "percentage": 34.29, "elapsed_time": "0:21:44", "remaining_time": "0:41:40", "throughput": 5814.94, "total_tokens": 7586144} {"current_steps": 11635, "total_steps": 33920, "loss": 0.4278, "lr": 8.306775461116727e-06, "epoch": 6.8602594339622645, "percentage": 34.3, "elapsed_time": "0:21:45", "remaining_time": "0:41:39", "throughput": 5815.03, "total_tokens": 7589184} {"current_steps": 11640, "total_steps": 33920, "loss": 0.3716, "lr": 8.304845300178597e-06, "epoch": 6.863207547169811, "percentage": 34.32, "elapsed_time": "0:21:45", "remaining_time": "0:41:39", "throughput": 5815.1, "total_tokens": 7592480} {"current_steps": 11645, "total_steps": 33920, "loss": 0.4902, "lr": 8.302914264268433e-06, "epoch": 6.866155660377358, "percentage": 34.33, "elapsed_time": "0:21:46", "remaining_time": "0:41:38", "throughput": 5815.24, "total_tokens": 7595584} {"current_steps": 11650, "total_steps": 33920, "loss": 0.3334, "lr": 8.300982353897482e-06, "epoch": 6.869103773584905, "percentage": 34.35, "elapsed_time": "0:21:46", "remaining_time": "0:41:37", "throughput": 5815.48, "total_tokens": 7599008} {"current_steps": 11655, "total_steps": 33920, "loss": 0.4292, "lr": 8.299049569577226e-06, "epoch": 6.872051886792453, "percentage": 34.36, "elapsed_time": "0:21:47", "remaining_time": "0:41:37", "throughput": 5815.49, "total_tokens": 7601728} {"current_steps": 11660, "total_steps": 33920, "loss": 0.4201, "lr": 8.297115911819379e-06, "epoch": 6.875, "percentage": 34.38, "elapsed_time": "0:21:47", "remaining_time": "0:41:36", "throughput": 5815.32, "total_tokens": 7604288} {"current_steps": 11665, "total_steps": 33920, "loss": 0.4505, "lr": 8.295181381135884e-06, "epoch": 6.877948113207547, "percentage": 34.39, "elapsed_time": "0:21:48", "remaining_time": "0:41:35", "throughput": 5815.57, "total_tokens": 7607648} {"current_steps": 11670, "total_steps": 33920, "loss": 0.376, "lr": 8.293245978038917e-06, "epoch": 6.880896226415095, "percentage": 34.4, "elapsed_time": "0:21:48", "remaining_time": "0:41:35", "throughput": 5815.86, "total_tokens": 7611360} {"current_steps": 11675, "total_steps": 33920, "loss": 0.3271, "lr": 8.291309703040884e-06, "epoch": 6.883844339622642, "percentage": 34.42, "elapsed_time": "0:21:49", "remaining_time": "0:41:35", "throughput": 5816.42, "total_tokens": 7617664} {"current_steps": 11680, "total_steps": 33920, "loss": 0.4598, "lr": 8.289372556654422e-06, "epoch": 6.886792452830189, "percentage": 34.43, "elapsed_time": "0:21:50", "remaining_time": "0:41:34", "throughput": 5816.4, "total_tokens": 7620480} {"current_steps": 11685, "total_steps": 33920, "loss": 0.4873, "lr": 8.287434539392401e-06, "epoch": 6.8897405660377355, "percentage": 34.45, "elapsed_time": "0:21:50", "remaining_time": "0:41:34", "throughput": 5816.79, "total_tokens": 7624352} {"current_steps": 11690, "total_steps": 33920, "loss": 0.4431, "lr": 8.285495651767916e-06, "epoch": 6.892688679245283, "percentage": 34.46, "elapsed_time": "0:21:51", "remaining_time": "0:41:33", "throughput": 5816.76, "total_tokens": 7627296} {"current_steps": 11695, "total_steps": 33920, "loss": 0.4, "lr": 8.283555894294297e-06, "epoch": 6.89563679245283, "percentage": 34.48, "elapsed_time": "0:21:51", "remaining_time": "0:41:32", "throughput": 5816.89, "total_tokens": 7630816} {"current_steps": 11700, "total_steps": 33920, "loss": 0.5964, "lr": 8.281615267485105e-06, "epoch": 6.898584905660377, "percentage": 34.49, "elapsed_time": "0:21:52", "remaining_time": "0:41:32", "throughput": 5816.96, "total_tokens": 7633920} {"current_steps": 11705, "total_steps": 33920, "loss": 0.4768, "lr": 8.279673771854127e-06, "epoch": 6.901533018867925, "percentage": 34.51, "elapsed_time": "0:21:52", "remaining_time": "0:41:31", "throughput": 5817.33, "total_tokens": 7637920} {"current_steps": 11710, "total_steps": 33920, "loss": 0.541, "lr": 8.277731407915386e-06, "epoch": 6.904481132075472, "percentage": 34.52, "elapsed_time": "0:21:53", "remaining_time": "0:41:31", "throughput": 5817.36, "total_tokens": 7640800} {"current_steps": 11715, "total_steps": 33920, "loss": 0.3586, "lr": 8.275788176183126e-06, "epoch": 6.907429245283019, "percentage": 34.54, "elapsed_time": "0:21:54", "remaining_time": "0:41:30", "throughput": 5817.7, "total_tokens": 7644480} {"current_steps": 11720, "total_steps": 33920, "loss": 0.4119, "lr": 8.273844077171827e-06, "epoch": 6.910377358490566, "percentage": 34.55, "elapsed_time": "0:21:54", "remaining_time": "0:41:30", "throughput": 5817.91, "total_tokens": 7647936} {"current_steps": 11725, "total_steps": 33920, "loss": 0.4406, "lr": 8.271899111396202e-06, "epoch": 6.913325471698113, "percentage": 34.57, "elapsed_time": "0:21:55", "remaining_time": "0:41:29", "throughput": 5818.18, "total_tokens": 7651264} {"current_steps": 11730, "total_steps": 33920, "loss": 0.492, "lr": 8.269953279371185e-06, "epoch": 6.91627358490566, "percentage": 34.58, "elapsed_time": "0:21:55", "remaining_time": "0:41:28", "throughput": 5818.37, "total_tokens": 7654496} {"current_steps": 11735, "total_steps": 33920, "loss": 0.4332, "lr": 8.268006581611945e-06, "epoch": 6.9192216981132075, "percentage": 34.6, "elapsed_time": "0:21:56", "remaining_time": "0:41:28", "throughput": 5818.63, "total_tokens": 7657856} {"current_steps": 11740, "total_steps": 33920, "loss": 0.4429, "lr": 8.266059018633878e-06, "epoch": 6.922169811320755, "percentage": 34.61, "elapsed_time": "0:21:56", "remaining_time": "0:41:27", "throughput": 5818.4, "total_tokens": 7660192} {"current_steps": 11745, "total_steps": 33920, "loss": 0.3879, "lr": 8.264110590952609e-06, "epoch": 6.925117924528302, "percentage": 34.63, "elapsed_time": "0:21:57", "remaining_time": "0:41:26", "throughput": 5818.62, "total_tokens": 7663904} {"current_steps": 11750, "total_steps": 33920, "loss": 0.3115, "lr": 8.262161299083993e-06, "epoch": 6.928066037735849, "percentage": 34.64, "elapsed_time": "0:21:57", "remaining_time": "0:41:26", "throughput": 5818.6, "total_tokens": 7666688} {"current_steps": 11755, "total_steps": 33920, "loss": 0.3835, "lr": 8.260211143544117e-06, "epoch": 6.931014150943396, "percentage": 34.66, "elapsed_time": "0:21:58", "remaining_time": "0:41:25", "throughput": 5818.84, "total_tokens": 7670080} {"current_steps": 11760, "total_steps": 33920, "loss": 0.4932, "lr": 8.258260124849288e-06, "epoch": 6.933962264150943, "percentage": 34.67, "elapsed_time": "0:21:58", "remaining_time": "0:41:24", "throughput": 5818.83, "total_tokens": 7672768} {"current_steps": 11765, "total_steps": 33920, "loss": 0.3607, "lr": 8.256308243516048e-06, "epoch": 6.93691037735849, "percentage": 34.68, "elapsed_time": "0:21:59", "remaining_time": "0:41:24", "throughput": 5818.88, "total_tokens": 7675744} {"current_steps": 11770, "total_steps": 33920, "loss": 0.3709, "lr": 8.254355500061168e-06, "epoch": 6.939858490566038, "percentage": 34.7, "elapsed_time": "0:21:59", "remaining_time": "0:41:23", "throughput": 5818.72, "total_tokens": 7678400} {"current_steps": 11775, "total_steps": 33920, "loss": 0.6518, "lr": 8.252401895001643e-06, "epoch": 6.942806603773585, "percentage": 34.71, "elapsed_time": "0:22:00", "remaining_time": "0:41:22", "throughput": 5818.96, "total_tokens": 7681760} {"current_steps": 11780, "total_steps": 33920, "loss": 0.5036, "lr": 8.2504474288547e-06, "epoch": 6.945754716981132, "percentage": 34.73, "elapsed_time": "0:22:00", "remaining_time": "0:41:22", "throughput": 5818.95, "total_tokens": 7684480} {"current_steps": 11785, "total_steps": 33920, "loss": 0.4585, "lr": 8.248492102137791e-06, "epoch": 6.9487028301886795, "percentage": 34.74, "elapsed_time": "0:22:01", "remaining_time": "0:41:21", "throughput": 5818.55, "total_tokens": 7686816} {"current_steps": 11790, "total_steps": 33920, "loss": 0.4664, "lr": 8.246535915368596e-06, "epoch": 6.951650943396227, "percentage": 34.76, "elapsed_time": "0:22:01", "remaining_time": "0:41:20", "throughput": 5818.91, "total_tokens": 7691072} {"current_steps": 11795, "total_steps": 33920, "loss": 0.3612, "lr": 8.24457886906503e-06, "epoch": 6.954599056603773, "percentage": 34.77, "elapsed_time": "0:22:02", "remaining_time": "0:41:20", "throughput": 5819.33, "total_tokens": 7695168} {"current_steps": 11800, "total_steps": 33920, "loss": 0.3018, "lr": 8.242620963745222e-06, "epoch": 6.9575471698113205, "percentage": 34.79, "elapsed_time": "0:22:02", "remaining_time": "0:41:19", "throughput": 5819.56, "total_tokens": 7698560} {"current_steps": 11805, "total_steps": 33920, "loss": 0.4631, "lr": 8.240662199927538e-06, "epoch": 6.960495283018868, "percentage": 34.8, "elapsed_time": "0:22:03", "remaining_time": "0:41:19", "throughput": 5819.72, "total_tokens": 7702016} {"current_steps": 11810, "total_steps": 33920, "loss": 0.4655, "lr": 8.238702578130573e-06, "epoch": 6.963443396226415, "percentage": 34.82, "elapsed_time": "0:22:03", "remaining_time": "0:41:18", "throughput": 5819.83, "total_tokens": 7705376} {"current_steps": 11815, "total_steps": 33920, "loss": 0.6098, "lr": 8.23674209887314e-06, "epoch": 6.966391509433962, "percentage": 34.83, "elapsed_time": "0:22:04", "remaining_time": "0:41:17", "throughput": 5819.84, "total_tokens": 7708128} {"current_steps": 11820, "total_steps": 33920, "loss": 0.3823, "lr": 8.234780762674288e-06, "epoch": 6.96933962264151, "percentage": 34.85, "elapsed_time": "0:22:04", "remaining_time": "0:41:17", "throughput": 5820.26, "total_tokens": 7711776} {"current_steps": 11825, "total_steps": 33920, "loss": 0.4944, "lr": 8.232818570053286e-06, "epoch": 6.972287735849057, "percentage": 34.86, "elapsed_time": "0:22:05", "remaining_time": "0:41:16", "throughput": 5820.35, "total_tokens": 7714976} {"current_steps": 11830, "total_steps": 33920, "loss": 0.483, "lr": 8.230855521529637e-06, "epoch": 6.975235849056604, "percentage": 34.88, "elapsed_time": "0:22:06", "remaining_time": "0:41:16", "throughput": 5820.61, "total_tokens": 7718432} {"current_steps": 11835, "total_steps": 33920, "loss": 0.6142, "lr": 8.228891617623064e-06, "epoch": 6.978183962264151, "percentage": 34.89, "elapsed_time": "0:22:06", "remaining_time": "0:41:15", "throughput": 5820.3, "total_tokens": 7720640} {"current_steps": 11840, "total_steps": 33920, "loss": 0.4694, "lr": 8.22692685885352e-06, "epoch": 6.981132075471698, "percentage": 34.91, "elapsed_time": "0:22:06", "remaining_time": "0:41:14", "throughput": 5820.14, "total_tokens": 7723232} {"current_steps": 11845, "total_steps": 33920, "loss": 0.3445, "lr": 8.224961245741183e-06, "epoch": 6.984080188679245, "percentage": 34.92, "elapsed_time": "0:22:07", "remaining_time": "0:41:14", "throughput": 5820.65, "total_tokens": 7727712} {"current_steps": 11850, "total_steps": 33920, "loss": 0.4319, "lr": 8.222994778806457e-06, "epoch": 6.9870283018867925, "percentage": 34.94, "elapsed_time": "0:22:08", "remaining_time": "0:41:13", "throughput": 5820.71, "total_tokens": 7730816} {"current_steps": 11855, "total_steps": 33920, "loss": 0.511, "lr": 8.221027458569972e-06, "epoch": 6.98997641509434, "percentage": 34.95, "elapsed_time": "0:22:08", "remaining_time": "0:41:12", "throughput": 5821.07, "total_tokens": 7734336} {"current_steps": 11860, "total_steps": 33920, "loss": 0.4371, "lr": 8.219059285552586e-06, "epoch": 6.992924528301887, "percentage": 34.96, "elapsed_time": "0:22:09", "remaining_time": "0:41:12", "throughput": 5821.24, "total_tokens": 7737504} {"current_steps": 11865, "total_steps": 33920, "loss": 0.5436, "lr": 8.21709026027538e-06, "epoch": 6.995872641509434, "percentage": 34.98, "elapsed_time": "0:22:09", "remaining_time": "0:41:11", "throughput": 5821.74, "total_tokens": 7741952} {"current_steps": 11870, "total_steps": 33920, "loss": 0.4869, "lr": 8.215120383259664e-06, "epoch": 6.998820754716981, "percentage": 34.99, "elapsed_time": "0:22:10", "remaining_time": "0:41:11", "throughput": 5822.0, "total_tokens": 7745280} {"current_steps": 11875, "total_steps": 33920, "loss": 0.4837, "lr": 8.21314965502697e-06, "epoch": 7.001768867924528, "percentage": 35.01, "elapsed_time": "0:22:11", "remaining_time": "0:41:11", "throughput": 5820.45, "total_tokens": 7747712} {"current_steps": 11880, "total_steps": 33920, "loss": 0.3015, "lr": 8.211178076099056e-06, "epoch": 7.004716981132075, "percentage": 35.02, "elapsed_time": "0:22:11", "remaining_time": "0:41:10", "throughput": 5820.57, "total_tokens": 7750848} {"current_steps": 11885, "total_steps": 33920, "loss": 0.3273, "lr": 8.209205646997909e-06, "epoch": 7.007665094339623, "percentage": 35.04, "elapsed_time": "0:22:12", "remaining_time": "0:41:09", "throughput": 5820.92, "total_tokens": 7754688} {"current_steps": 11890, "total_steps": 33920, "loss": 0.3342, "lr": 8.207232368245735e-06, "epoch": 7.01061320754717, "percentage": 35.05, "elapsed_time": "0:22:12", "remaining_time": "0:41:09", "throughput": 5821.31, "total_tokens": 7758688} {"current_steps": 11895, "total_steps": 33920, "loss": 0.3225, "lr": 8.205258240364968e-06, "epoch": 7.013561320754717, "percentage": 35.07, "elapsed_time": "0:22:13", "remaining_time": "0:41:08", "throughput": 5821.51, "total_tokens": 7762048} {"current_steps": 11900, "total_steps": 33920, "loss": 0.3935, "lr": 8.203283263878268e-06, "epoch": 7.0165094339622645, "percentage": 35.08, "elapsed_time": "0:22:13", "remaining_time": "0:41:08", "throughput": 5821.29, "total_tokens": 7764448} {"current_steps": 11905, "total_steps": 33920, "loss": 0.3824, "lr": 8.201307439308518e-06, "epoch": 7.019457547169812, "percentage": 35.1, "elapsed_time": "0:22:14", "remaining_time": "0:41:07", "throughput": 5821.08, "total_tokens": 7766816} {"current_steps": 11910, "total_steps": 33920, "loss": 0.4043, "lr": 8.199330767178828e-06, "epoch": 7.022405660377358, "percentage": 35.11, "elapsed_time": "0:22:14", "remaining_time": "0:41:06", "throughput": 5821.43, "total_tokens": 7770688} {"current_steps": 11915, "total_steps": 33920, "loss": 0.5366, "lr": 8.19735324801253e-06, "epoch": 7.025353773584905, "percentage": 35.13, "elapsed_time": "0:22:15", "remaining_time": "0:41:06", "throughput": 5821.43, "total_tokens": 7773632} {"current_steps": 11920, "total_steps": 33920, "loss": 0.5753, "lr": 8.195374882333178e-06, "epoch": 7.028301886792453, "percentage": 35.14, "elapsed_time": "0:22:15", "remaining_time": "0:41:05", "throughput": 5821.3, "total_tokens": 7776224} {"current_steps": 11925, "total_steps": 33920, "loss": 0.4906, "lr": 8.193395670664555e-06, "epoch": 7.03125, "percentage": 35.16, "elapsed_time": "0:22:16", "remaining_time": "0:41:04", "throughput": 5821.09, "total_tokens": 7778816} {"current_steps": 11930, "total_steps": 33920, "loss": 0.4363, "lr": 8.191415613530667e-06, "epoch": 7.034198113207547, "percentage": 35.17, "elapsed_time": "0:22:16", "remaining_time": "0:41:04", "throughput": 5820.74, "total_tokens": 7781056} {"current_steps": 11935, "total_steps": 33920, "loss": 0.4459, "lr": 8.189434711455739e-06, "epoch": 7.037146226415095, "percentage": 35.19, "elapsed_time": "0:22:17", "remaining_time": "0:41:03", "throughput": 5820.84, "total_tokens": 7784064} {"current_steps": 11940, "total_steps": 33920, "loss": 0.416, "lr": 8.187452964964226e-06, "epoch": 7.040094339622642, "percentage": 35.2, "elapsed_time": "0:22:17", "remaining_time": "0:41:02", "throughput": 5821.09, "total_tokens": 7787616} {"current_steps": 11945, "total_steps": 33920, "loss": 0.5803, "lr": 8.185470374580805e-06, "epoch": 7.043042452830188, "percentage": 35.22, "elapsed_time": "0:22:18", "remaining_time": "0:41:02", "throughput": 5821.42, "total_tokens": 7791168} {"current_steps": 11950, "total_steps": 33920, "loss": 0.4739, "lr": 8.183486940830371e-06, "epoch": 7.0459905660377355, "percentage": 35.23, "elapsed_time": "0:22:18", "remaining_time": "0:41:01", "throughput": 5821.63, "total_tokens": 7794784} {"current_steps": 11955, "total_steps": 33920, "loss": 0.4084, "lr": 8.18150266423805e-06, "epoch": 7.048938679245283, "percentage": 35.24, "elapsed_time": "0:22:19", "remaining_time": "0:41:01", "throughput": 5821.73, "total_tokens": 7797984} {"current_steps": 11960, "total_steps": 33920, "loss": 0.4017, "lr": 8.179517545329188e-06, "epoch": 7.05188679245283, "percentage": 35.26, "elapsed_time": "0:22:20", "remaining_time": "0:41:00", "throughput": 5821.87, "total_tokens": 7801472} {"current_steps": 11965, "total_steps": 33920, "loss": 0.2901, "lr": 8.177531584629353e-06, "epoch": 7.054834905660377, "percentage": 35.27, "elapsed_time": "0:22:20", "remaining_time": "0:40:59", "throughput": 5821.55, "total_tokens": 7803808} {"current_steps": 11970, "total_steps": 33920, "loss": 0.4454, "lr": 8.175544782664335e-06, "epoch": 7.057783018867925, "percentage": 35.29, "elapsed_time": "0:22:21", "remaining_time": "0:40:59", "throughput": 5821.36, "total_tokens": 7806528} {"current_steps": 11975, "total_steps": 33920, "loss": 0.4679, "lr": 8.173557139960151e-06, "epoch": 7.060731132075472, "percentage": 35.3, "elapsed_time": "0:22:21", "remaining_time": "0:40:58", "throughput": 5821.31, "total_tokens": 7809856} {"current_steps": 11980, "total_steps": 33920, "loss": 0.3541, "lr": 8.17156865704304e-06, "epoch": 7.063679245283019, "percentage": 35.32, "elapsed_time": "0:22:22", "remaining_time": "0:40:58", "throughput": 5822.04, "total_tokens": 7815200} {"current_steps": 11985, "total_steps": 33920, "loss": 0.5896, "lr": 8.169579334439453e-06, "epoch": 7.066627358490566, "percentage": 35.33, "elapsed_time": "0:22:22", "remaining_time": "0:40:57", "throughput": 5821.96, "total_tokens": 7817824} {"current_steps": 11990, "total_steps": 33920, "loss": 0.3398, "lr": 8.16758917267608e-06, "epoch": 7.069575471698113, "percentage": 35.35, "elapsed_time": "0:22:23", "remaining_time": "0:40:57", "throughput": 5822.33, "total_tokens": 7821856} {"current_steps": 11995, "total_steps": 33920, "loss": 0.4701, "lr": 8.165598172279822e-06, "epoch": 7.07252358490566, "percentage": 35.36, "elapsed_time": "0:22:23", "remaining_time": "0:40:56", "throughput": 5822.23, "total_tokens": 7824544} {"current_steps": 12000, "total_steps": 33920, "loss": 0.4128, "lr": 8.163606333777804e-06, "epoch": 7.0754716981132075, "percentage": 35.38, "elapsed_time": "0:22:24", "remaining_time": "0:40:55", "throughput": 5822.21, "total_tokens": 7827328} {"current_steps": 12005, "total_steps": 33920, "loss": 0.421, "lr": 8.161613657697374e-06, "epoch": 7.078419811320755, "percentage": 35.39, "elapsed_time": "0:22:24", "remaining_time": "0:40:55", "throughput": 5822.5, "total_tokens": 7830880} {"current_steps": 12010, "total_steps": 33920, "loss": 0.3233, "lr": 8.159620144566103e-06, "epoch": 7.081367924528302, "percentage": 35.41, "elapsed_time": "0:22:25", "remaining_time": "0:40:54", "throughput": 5822.6, "total_tokens": 7833920} {"current_steps": 12015, "total_steps": 33920, "loss": 0.3889, "lr": 8.157625794911782e-06, "epoch": 7.084316037735849, "percentage": 35.42, "elapsed_time": "0:22:25", "remaining_time": "0:40:53", "throughput": 5822.45, "total_tokens": 7836768} {"current_steps": 12020, "total_steps": 33920, "loss": 0.3213, "lr": 8.155630609262424e-06, "epoch": 7.087264150943396, "percentage": 35.44, "elapsed_time": "0:22:26", "remaining_time": "0:40:53", "throughput": 5822.73, "total_tokens": 7840576} {"current_steps": 12025, "total_steps": 33920, "loss": 0.371, "lr": 8.153634588146262e-06, "epoch": 7.090212264150943, "percentage": 35.45, "elapsed_time": "0:22:27", "remaining_time": "0:40:52", "throughput": 5823.03, "total_tokens": 7844000} {"current_steps": 12030, "total_steps": 33920, "loss": 0.4403, "lr": 8.15163773209175e-06, "epoch": 7.09316037735849, "percentage": 35.47, "elapsed_time": "0:22:27", "remaining_time": "0:40:52", "throughput": 5823.13, "total_tokens": 7847072} {"current_steps": 12035, "total_steps": 33920, "loss": 0.3444, "lr": 8.149640041627566e-06, "epoch": 7.096108490566038, "percentage": 35.48, "elapsed_time": "0:22:28", "remaining_time": "0:40:51", "throughput": 5823.63, "total_tokens": 7851264} {"current_steps": 12040, "total_steps": 33920, "loss": 0.5278, "lr": 8.147641517282608e-06, "epoch": 7.099056603773585, "percentage": 35.5, "elapsed_time": "0:22:28", "remaining_time": "0:40:50", "throughput": 5823.78, "total_tokens": 7854656} {"current_steps": 12045, "total_steps": 33920, "loss": 0.5214, "lr": 8.145642159585992e-06, "epoch": 7.102004716981132, "percentage": 35.51, "elapsed_time": "0:22:29", "remaining_time": "0:40:50", "throughput": 5824.23, "total_tokens": 7859520} {"current_steps": 12050, "total_steps": 33920, "loss": 0.3462, "lr": 8.143641969067057e-06, "epoch": 7.1049528301886795, "percentage": 35.52, "elapsed_time": "0:22:29", "remaining_time": "0:40:50", "throughput": 5824.18, "total_tokens": 7862400} {"current_steps": 12055, "total_steps": 33920, "loss": 0.3447, "lr": 8.141640946255362e-06, "epoch": 7.107900943396227, "percentage": 35.54, "elapsed_time": "0:22:30", "remaining_time": "0:40:49", "throughput": 5823.86, "total_tokens": 7865088} {"current_steps": 12060, "total_steps": 33920, "loss": 0.3318, "lr": 8.139639091680687e-06, "epoch": 7.110849056603773, "percentage": 35.55, "elapsed_time": "0:22:31", "remaining_time": "0:40:48", "throughput": 5824.16, "total_tokens": 7868736} {"current_steps": 12065, "total_steps": 33920, "loss": 0.5793, "lr": 8.137636405873031e-06, "epoch": 7.1137971698113205, "percentage": 35.57, "elapsed_time": "0:22:31", "remaining_time": "0:40:48", "throughput": 5824.18, "total_tokens": 7871552} {"current_steps": 12070, "total_steps": 33920, "loss": 0.4085, "lr": 8.135632889362614e-06, "epoch": 7.116745283018868, "percentage": 35.58, "elapsed_time": "0:22:32", "remaining_time": "0:40:47", "throughput": 5824.05, "total_tokens": 7874240} {"current_steps": 12075, "total_steps": 33920, "loss": 0.4844, "lr": 8.133628542679879e-06, "epoch": 7.119693396226415, "percentage": 35.6, "elapsed_time": "0:22:32", "remaining_time": "0:40:46", "throughput": 5824.12, "total_tokens": 7877632} {"current_steps": 12080, "total_steps": 33920, "loss": 0.4264, "lr": 8.131623366355478e-06, "epoch": 7.122641509433962, "percentage": 35.61, "elapsed_time": "0:22:33", "remaining_time": "0:40:46", "throughput": 5823.98, "total_tokens": 7880160} {"current_steps": 12085, "total_steps": 33920, "loss": 0.4005, "lr": 8.129617360920297e-06, "epoch": 7.12558962264151, "percentage": 35.63, "elapsed_time": "0:22:33", "remaining_time": "0:40:45", "throughput": 5824.02, "total_tokens": 7883136} {"current_steps": 12090, "total_steps": 33920, "loss": 0.2636, "lr": 8.12761052690543e-06, "epoch": 7.128537735849057, "percentage": 35.64, "elapsed_time": "0:22:34", "remaining_time": "0:40:44", "throughput": 5823.56, "total_tokens": 7885408} {"current_steps": 12095, "total_steps": 33920, "loss": 0.4684, "lr": 8.125602864842197e-06, "epoch": 7.131485849056604, "percentage": 35.66, "elapsed_time": "0:22:34", "remaining_time": "0:40:44", "throughput": 5823.63, "total_tokens": 7888224} {"current_steps": 12100, "total_steps": 33920, "loss": 0.4637, "lr": 8.123594375262135e-06, "epoch": 7.134433962264151, "percentage": 35.67, "elapsed_time": "0:22:35", "remaining_time": "0:40:43", "throughput": 5823.96, "total_tokens": 7891808} {"current_steps": 12105, "total_steps": 33920, "loss": 0.4083, "lr": 8.121585058697e-06, "epoch": 7.137382075471698, "percentage": 35.69, "elapsed_time": "0:22:35", "remaining_time": "0:40:42", "throughput": 5824.05, "total_tokens": 7894912} {"current_steps": 12110, "total_steps": 33920, "loss": 0.5051, "lr": 8.119574915678767e-06, "epoch": 7.140330188679245, "percentage": 35.7, "elapsed_time": "0:22:36", "remaining_time": "0:40:42", "throughput": 5824.36, "total_tokens": 7898560} {"current_steps": 12115, "total_steps": 33920, "loss": 0.345, "lr": 8.117563946739632e-06, "epoch": 7.1432783018867925, "percentage": 35.72, "elapsed_time": "0:22:36", "remaining_time": "0:40:41", "throughput": 5824.29, "total_tokens": 7901248} {"current_steps": 12120, "total_steps": 33920, "loss": 0.3347, "lr": 8.115552152412006e-06, "epoch": 7.14622641509434, "percentage": 35.73, "elapsed_time": "0:22:37", "remaining_time": "0:40:41", "throughput": 5824.58, "total_tokens": 7905088} {"current_steps": 12125, "total_steps": 33920, "loss": 0.4253, "lr": 8.11353953322852e-06, "epoch": 7.149174528301887, "percentage": 35.75, "elapsed_time": "0:22:37", "remaining_time": "0:40:40", "throughput": 5824.53, "total_tokens": 7907936} {"current_steps": 12130, "total_steps": 33920, "loss": 0.424, "lr": 8.111526089722024e-06, "epoch": 7.152122641509434, "percentage": 35.76, "elapsed_time": "0:22:38", "remaining_time": "0:40:39", "throughput": 5824.41, "total_tokens": 7910496} {"current_steps": 12135, "total_steps": 33920, "loss": 0.4137, "lr": 8.109511822425586e-06, "epoch": 7.155070754716981, "percentage": 35.78, "elapsed_time": "0:22:38", "remaining_time": "0:40:39", "throughput": 5824.62, "total_tokens": 7913856} {"current_steps": 12140, "total_steps": 33920, "loss": 0.3229, "lr": 8.107496731872491e-06, "epoch": 7.158018867924528, "percentage": 35.79, "elapsed_time": "0:22:39", "remaining_time": "0:40:39", "throughput": 5824.93, "total_tokens": 7919200} {"current_steps": 12145, "total_steps": 33920, "loss": 0.3888, "lr": 8.105480818596243e-06, "epoch": 7.160966981132075, "percentage": 35.8, "elapsed_time": "0:22:40", "remaining_time": "0:40:38", "throughput": 5824.8, "total_tokens": 7922048} {"current_steps": 12150, "total_steps": 33920, "loss": 0.401, "lr": 8.103464083130566e-06, "epoch": 7.163915094339623, "percentage": 35.82, "elapsed_time": "0:22:40", "remaining_time": "0:40:37", "throughput": 5824.7, "total_tokens": 7924672} {"current_steps": 12155, "total_steps": 33920, "loss": 0.4345, "lr": 8.101446526009397e-06, "epoch": 7.16686320754717, "percentage": 35.83, "elapsed_time": "0:22:41", "remaining_time": "0:40:37", "throughput": 5824.89, "total_tokens": 7927744} {"current_steps": 12160, "total_steps": 33920, "loss": 0.347, "lr": 8.099428147766894e-06, "epoch": 7.169811320754717, "percentage": 35.85, "elapsed_time": "0:22:41", "remaining_time": "0:40:36", "throughput": 5824.93, "total_tokens": 7930816} {"current_steps": 12165, "total_steps": 33920, "loss": 0.4496, "lr": 8.097408948937431e-06, "epoch": 7.1727594339622645, "percentage": 35.86, "elapsed_time": "0:22:42", "remaining_time": "0:40:35", "throughput": 5824.77, "total_tokens": 7933408} {"current_steps": 12170, "total_steps": 33920, "loss": 0.3722, "lr": 8.095388930055599e-06, "epoch": 7.175707547169812, "percentage": 35.88, "elapsed_time": "0:22:42", "remaining_time": "0:40:35", "throughput": 5825.08, "total_tokens": 7937216} {"current_steps": 12175, "total_steps": 33920, "loss": 0.3512, "lr": 8.093368091656209e-06, "epoch": 7.178655660377358, "percentage": 35.89, "elapsed_time": "0:22:43", "remaining_time": "0:40:34", "throughput": 5825.36, "total_tokens": 7940800} {"current_steps": 12180, "total_steps": 33920, "loss": 0.4128, "lr": 8.091346434274284e-06, "epoch": 7.181603773584905, "percentage": 35.91, "elapsed_time": "0:22:43", "remaining_time": "0:40:34", "throughput": 5825.45, "total_tokens": 7944000} {"current_steps": 12185, "total_steps": 33920, "loss": 0.4007, "lr": 8.089323958445068e-06, "epoch": 7.184551886792453, "percentage": 35.92, "elapsed_time": "0:22:44", "remaining_time": "0:40:33", "throughput": 5825.07, "total_tokens": 7946144} {"current_steps": 12190, "total_steps": 33920, "loss": 0.4061, "lr": 8.08730066470402e-06, "epoch": 7.1875, "percentage": 35.94, "elapsed_time": "0:22:44", "remaining_time": "0:40:32", "throughput": 5824.71, "total_tokens": 7948416} {"current_steps": 12195, "total_steps": 33920, "loss": 0.3687, "lr": 8.085276553586814e-06, "epoch": 7.190448113207547, "percentage": 35.95, "elapsed_time": "0:22:45", "remaining_time": "0:40:31", "throughput": 5824.52, "total_tokens": 7950976} {"current_steps": 12200, "total_steps": 33920, "loss": 0.4074, "lr": 8.083251625629345e-06, "epoch": 7.193396226415095, "percentage": 35.97, "elapsed_time": "0:22:45", "remaining_time": "0:40:31", "throughput": 5824.34, "total_tokens": 7953824} {"current_steps": 12205, "total_steps": 33920, "loss": 0.4512, "lr": 8.08122588136772e-06, "epoch": 7.196344339622642, "percentage": 35.98, "elapsed_time": "0:22:46", "remaining_time": "0:40:30", "throughput": 5824.24, "total_tokens": 7956576} {"current_steps": 12210, "total_steps": 33920, "loss": 0.4588, "lr": 8.079199321338262e-06, "epoch": 7.199292452830188, "percentage": 36.0, "elapsed_time": "0:22:46", "remaining_time": "0:40:29", "throughput": 5824.35, "total_tokens": 7959584} {"current_steps": 12215, "total_steps": 33920, "loss": 0.411, "lr": 8.077171946077516e-06, "epoch": 7.2022405660377355, "percentage": 36.01, "elapsed_time": "0:22:47", "remaining_time": "0:40:29", "throughput": 5824.66, "total_tokens": 7963712} {"current_steps": 12220, "total_steps": 33920, "loss": 0.415, "lr": 8.075143756122232e-06, "epoch": 7.205188679245283, "percentage": 36.03, "elapsed_time": "0:22:47", "remaining_time": "0:40:28", "throughput": 5824.99, "total_tokens": 7967680} {"current_steps": 12225, "total_steps": 33920, "loss": 0.379, "lr": 8.073114752009388e-06, "epoch": 7.20813679245283, "percentage": 36.04, "elapsed_time": "0:22:48", "remaining_time": "0:40:28", "throughput": 5824.98, "total_tokens": 7970464} {"current_steps": 12230, "total_steps": 33920, "loss": 0.5107, "lr": 8.071084934276168e-06, "epoch": 7.211084905660377, "percentage": 36.06, "elapsed_time": "0:22:48", "remaining_time": "0:40:27", "throughput": 5825.16, "total_tokens": 7973696} {"current_steps": 12235, "total_steps": 33920, "loss": 0.3574, "lr": 8.069054303459976e-06, "epoch": 7.214033018867925, "percentage": 36.07, "elapsed_time": "0:22:49", "remaining_time": "0:40:26", "throughput": 5825.13, "total_tokens": 7976352} {"current_steps": 12240, "total_steps": 33920, "loss": 0.5213, "lr": 8.06702286009843e-06, "epoch": 7.216981132075472, "percentage": 36.08, "elapsed_time": "0:22:49", "remaining_time": "0:40:26", "throughput": 5825.26, "total_tokens": 7979712} {"current_steps": 12245, "total_steps": 33920, "loss": 0.4471, "lr": 8.064990604729363e-06, "epoch": 7.219929245283019, "percentage": 36.1, "elapsed_time": "0:22:50", "remaining_time": "0:40:25", "throughput": 5825.2, "total_tokens": 7982656} {"current_steps": 12250, "total_steps": 33920, "loss": 0.3829, "lr": 8.062957537890827e-06, "epoch": 7.222877358490566, "percentage": 36.11, "elapsed_time": "0:22:50", "remaining_time": "0:40:25", "throughput": 5825.14, "total_tokens": 7985408} {"current_steps": 12255, "total_steps": 33920, "loss": 0.4369, "lr": 8.060923660121081e-06, "epoch": 7.225825471698113, "percentage": 36.13, "elapsed_time": "0:22:51", "remaining_time": "0:40:24", "throughput": 5825.18, "total_tokens": 7988128} {"current_steps": 12260, "total_steps": 33920, "loss": 0.4046, "lr": 8.058888971958603e-06, "epoch": 7.22877358490566, "percentage": 36.14, "elapsed_time": "0:22:51", "remaining_time": "0:40:23", "throughput": 5825.28, "total_tokens": 7991136} {"current_steps": 12265, "total_steps": 33920, "loss": 0.3102, "lr": 8.056853473942085e-06, "epoch": 7.2317216981132075, "percentage": 36.16, "elapsed_time": "0:22:52", "remaining_time": "0:40:22", "throughput": 5825.36, "total_tokens": 7994176} {"current_steps": 12270, "total_steps": 33920, "loss": 0.4642, "lr": 8.054817166610438e-06, "epoch": 7.234669811320755, "percentage": 36.17, "elapsed_time": "0:22:52", "remaining_time": "0:40:22", "throughput": 5825.41, "total_tokens": 7997184} {"current_steps": 12275, "total_steps": 33920, "loss": 0.3713, "lr": 8.052780050502781e-06, "epoch": 7.237617924528302, "percentage": 36.19, "elapsed_time": "0:22:53", "remaining_time": "0:40:21", "throughput": 5825.71, "total_tokens": 8001056} {"current_steps": 12280, "total_steps": 33920, "loss": 0.4258, "lr": 8.050742126158448e-06, "epoch": 7.240566037735849, "percentage": 36.2, "elapsed_time": "0:22:53", "remaining_time": "0:40:21", "throughput": 5825.76, "total_tokens": 8004416} {"current_steps": 12285, "total_steps": 33920, "loss": 0.5149, "lr": 8.04870339411699e-06, "epoch": 7.243514150943396, "percentage": 36.22, "elapsed_time": "0:22:54", "remaining_time": "0:40:20", "throughput": 5826.11, "total_tokens": 8008768} {"current_steps": 12290, "total_steps": 33920, "loss": 0.4366, "lr": 8.046663854918166e-06, "epoch": 7.246462264150943, "percentage": 36.23, "elapsed_time": "0:22:55", "remaining_time": "0:40:20", "throughput": 5826.32, "total_tokens": 8012192} {"current_steps": 12295, "total_steps": 33920, "loss": 0.3766, "lr": 8.044623509101959e-06, "epoch": 7.24941037735849, "percentage": 36.25, "elapsed_time": "0:22:55", "remaining_time": "0:40:19", "throughput": 5826.43, "total_tokens": 8015616} {"current_steps": 12300, "total_steps": 33920, "loss": 0.3876, "lr": 8.042582357208557e-06, "epoch": 7.252358490566038, "percentage": 36.26, "elapsed_time": "0:22:56", "remaining_time": "0:40:19", "throughput": 5826.51, "total_tokens": 8018752} {"current_steps": 12305, "total_steps": 33920, "loss": 0.4784, "lr": 8.04054039977836e-06, "epoch": 7.255306603773585, "percentage": 36.28, "elapsed_time": "0:22:56", "remaining_time": "0:40:18", "throughput": 5826.87, "total_tokens": 8022656} {"current_steps": 12310, "total_steps": 33920, "loss": 0.3863, "lr": 8.038497637351992e-06, "epoch": 7.258254716981132, "percentage": 36.29, "elapsed_time": "0:22:57", "remaining_time": "0:40:17", "throughput": 5827.12, "total_tokens": 8025984} {"current_steps": 12315, "total_steps": 33920, "loss": 0.523, "lr": 8.036454070470276e-06, "epoch": 7.2612028301886795, "percentage": 36.31, "elapsed_time": "0:22:57", "remaining_time": "0:40:17", "throughput": 5826.78, "total_tokens": 8028352} {"current_steps": 12320, "total_steps": 33920, "loss": 0.4538, "lr": 8.03440969967426e-06, "epoch": 7.264150943396227, "percentage": 36.32, "elapsed_time": "0:22:58", "remaining_time": "0:40:16", "throughput": 5826.65, "total_tokens": 8030912} {"current_steps": 12325, "total_steps": 33920, "loss": 0.3874, "lr": 8.032364525505198e-06, "epoch": 7.267099056603773, "percentage": 36.34, "elapsed_time": "0:22:58", "remaining_time": "0:40:15", "throughput": 5826.96, "total_tokens": 8034432} {"current_steps": 12330, "total_steps": 33920, "loss": 0.6288, "lr": 8.030318548504561e-06, "epoch": 7.2700471698113205, "percentage": 36.35, "elapsed_time": "0:22:59", "remaining_time": "0:40:15", "throughput": 5827.07, "total_tokens": 8037440} {"current_steps": 12335, "total_steps": 33920, "loss": 0.3659, "lr": 8.028271769214026e-06, "epoch": 7.272995283018868, "percentage": 36.36, "elapsed_time": "0:22:59", "remaining_time": "0:40:14", "throughput": 5826.98, "total_tokens": 8040064} {"current_steps": 12340, "total_steps": 33920, "loss": 0.4535, "lr": 8.02622418817549e-06, "epoch": 7.275943396226415, "percentage": 36.38, "elapsed_time": "0:23:00", "remaining_time": "0:40:14", "throughput": 5827.22, "total_tokens": 8043840} {"current_steps": 12345, "total_steps": 33920, "loss": 0.5111, "lr": 8.024175805931056e-06, "epoch": 7.278891509433962, "percentage": 36.39, "elapsed_time": "0:23:00", "remaining_time": "0:40:13", "throughput": 5827.41, "total_tokens": 8047392} {"current_steps": 12350, "total_steps": 33920, "loss": 0.398, "lr": 8.022126623023045e-06, "epoch": 7.28183962264151, "percentage": 36.41, "elapsed_time": "0:23:01", "remaining_time": "0:40:12", "throughput": 5827.44, "total_tokens": 8050080} {"current_steps": 12355, "total_steps": 33920, "loss": 0.4353, "lr": 8.020076639993987e-06, "epoch": 7.284787735849057, "percentage": 36.42, "elapsed_time": "0:23:01", "remaining_time": "0:40:12", "throughput": 5827.64, "total_tokens": 8053504} {"current_steps": 12360, "total_steps": 33920, "loss": 0.3766, "lr": 8.018025857386622e-06, "epoch": 7.287735849056604, "percentage": 36.44, "elapsed_time": "0:23:02", "remaining_time": "0:40:11", "throughput": 5827.64, "total_tokens": 8056256} {"current_steps": 12365, "total_steps": 33920, "loss": 0.3381, "lr": 8.015974275743905e-06, "epoch": 7.290683962264151, "percentage": 36.45, "elapsed_time": "0:23:02", "remaining_time": "0:40:10", "throughput": 5827.83, "total_tokens": 8059616} {"current_steps": 12370, "total_steps": 33920, "loss": 0.2365, "lr": 8.013921895609e-06, "epoch": 7.293632075471698, "percentage": 36.47, "elapsed_time": "0:23:03", "remaining_time": "0:40:10", "throughput": 5828.1, "total_tokens": 8062944} {"current_steps": 12375, "total_steps": 33920, "loss": 0.3709, "lr": 8.011868717525283e-06, "epoch": 7.296580188679245, "percentage": 36.48, "elapsed_time": "0:23:04", "remaining_time": "0:40:09", "throughput": 5828.51, "total_tokens": 8067008} {"current_steps": 12380, "total_steps": 33920, "loss": 0.4789, "lr": 8.009814742036343e-06, "epoch": 7.2995283018867925, "percentage": 36.5, "elapsed_time": "0:23:04", "remaining_time": "0:40:08", "throughput": 5828.34, "total_tokens": 8069632} {"current_steps": 12385, "total_steps": 33920, "loss": 0.3749, "lr": 8.007759969685979e-06, "epoch": 7.30247641509434, "percentage": 36.51, "elapsed_time": "0:23:04", "remaining_time": "0:40:08", "throughput": 5828.33, "total_tokens": 8072160} {"current_steps": 12390, "total_steps": 33920, "loss": 0.4917, "lr": 8.005704401018199e-06, "epoch": 7.305424528301887, "percentage": 36.53, "elapsed_time": "0:23:05", "remaining_time": "0:40:07", "throughput": 5828.55, "total_tokens": 8075488} {"current_steps": 12395, "total_steps": 33920, "loss": 0.4914, "lr": 8.003648036577226e-06, "epoch": 7.308372641509434, "percentage": 36.54, "elapsed_time": "0:23:06", "remaining_time": "0:40:07", "throughput": 5828.8, "total_tokens": 8079040} {"current_steps": 12400, "total_steps": 33920, "loss": 0.3792, "lr": 8.00159087690749e-06, "epoch": 7.311320754716981, "percentage": 36.56, "elapsed_time": "0:23:06", "remaining_time": "0:40:06", "throughput": 5828.79, "total_tokens": 8081728} {"current_steps": 12405, "total_steps": 33920, "loss": 0.3497, "lr": 7.999532922553635e-06, "epoch": 7.314268867924528, "percentage": 36.57, "elapsed_time": "0:23:07", "remaining_time": "0:40:05", "throughput": 5828.98, "total_tokens": 8084832} {"current_steps": 12410, "total_steps": 33920, "loss": 0.4747, "lr": 7.997474174060508e-06, "epoch": 7.317216981132075, "percentage": 36.59, "elapsed_time": "0:23:07", "remaining_time": "0:40:05", "throughput": 5829.21, "total_tokens": 8088416} {"current_steps": 12415, "total_steps": 33920, "loss": 0.2893, "lr": 7.995414631973179e-06, "epoch": 7.320165094339623, "percentage": 36.6, "elapsed_time": "0:23:08", "remaining_time": "0:40:04", "throughput": 5829.4, "total_tokens": 8091584} {"current_steps": 12420, "total_steps": 33920, "loss": 0.2884, "lr": 7.993354296836914e-06, "epoch": 7.32311320754717, "percentage": 36.62, "elapsed_time": "0:23:08", "remaining_time": "0:40:03", "throughput": 5829.37, "total_tokens": 8094208} {"current_steps": 12425, "total_steps": 33920, "loss": 0.3217, "lr": 7.991293169197198e-06, "epoch": 7.326061320754717, "percentage": 36.63, "elapsed_time": "0:23:08", "remaining_time": "0:40:02", "throughput": 5829.29, "total_tokens": 8096864} {"current_steps": 12430, "total_steps": 33920, "loss": 0.4849, "lr": 7.989231249599725e-06, "epoch": 7.3290094339622645, "percentage": 36.65, "elapsed_time": "0:23:09", "remaining_time": "0:40:02", "throughput": 5829.34, "total_tokens": 8099712} {"current_steps": 12435, "total_steps": 33920, "loss": 0.3672, "lr": 7.987168538590395e-06, "epoch": 7.331957547169811, "percentage": 36.66, "elapsed_time": "0:23:09", "remaining_time": "0:40:01", "throughput": 5829.37, "total_tokens": 8102400} {"current_steps": 12440, "total_steps": 33920, "loss": 0.2029, "lr": 7.985105036715322e-06, "epoch": 7.334905660377358, "percentage": 36.67, "elapsed_time": "0:23:10", "remaining_time": "0:40:01", "throughput": 5830.05, "total_tokens": 8108288} {"current_steps": 12445, "total_steps": 33920, "loss": 0.2693, "lr": 7.983040744520823e-06, "epoch": 7.337853773584905, "percentage": 36.69, "elapsed_time": "0:23:11", "remaining_time": "0:40:00", "throughput": 5829.93, "total_tokens": 8111008} {"current_steps": 12450, "total_steps": 33920, "loss": 0.4571, "lr": 7.980975662553432e-06, "epoch": 7.340801886792453, "percentage": 36.7, "elapsed_time": "0:23:11", "remaining_time": "0:40:00", "throughput": 5830.22, "total_tokens": 8115008} {"current_steps": 12455, "total_steps": 33920, "loss": 0.3693, "lr": 7.978909791359888e-06, "epoch": 7.34375, "percentage": 36.72, "elapsed_time": "0:23:12", "remaining_time": "0:39:59", "throughput": 5830.45, "total_tokens": 8118752} {"current_steps": 12460, "total_steps": 33920, "loss": 0.5031, "lr": 7.976843131487136e-06, "epoch": 7.346698113207547, "percentage": 36.73, "elapsed_time": "0:23:12", "remaining_time": "0:39:59", "throughput": 5830.69, "total_tokens": 8122048} {"current_steps": 12465, "total_steps": 33920, "loss": 0.4317, "lr": 7.974775683482337e-06, "epoch": 7.349646226415095, "percentage": 36.75, "elapsed_time": "0:23:13", "remaining_time": "0:39:58", "throughput": 5830.39, "total_tokens": 8124448} {"current_steps": 12470, "total_steps": 33920, "loss": 0.5957, "lr": 7.972707447892855e-06, "epoch": 7.352594339622642, "percentage": 36.76, "elapsed_time": "0:23:14", "remaining_time": "0:39:58", "throughput": 5830.36, "total_tokens": 8128096} {"current_steps": 12475, "total_steps": 33920, "loss": 0.5007, "lr": 7.970638425266264e-06, "epoch": 7.355542452830189, "percentage": 36.78, "elapsed_time": "0:23:14", "remaining_time": "0:39:57", "throughput": 5830.32, "total_tokens": 8131488} {"current_steps": 12480, "total_steps": 33920, "loss": 0.3962, "lr": 7.968568616150349e-06, "epoch": 7.3584905660377355, "percentage": 36.79, "elapsed_time": "0:23:15", "remaining_time": "0:39:56", "throughput": 5830.45, "total_tokens": 8134688} {"current_steps": 12485, "total_steps": 33920, "loss": 0.3502, "lr": 7.966498021093096e-06, "epoch": 7.361438679245283, "percentage": 36.81, "elapsed_time": "0:23:15", "remaining_time": "0:39:56", "throughput": 5830.51, "total_tokens": 8138368} {"current_steps": 12490, "total_steps": 33920, "loss": 0.5062, "lr": 7.96442664064271e-06, "epoch": 7.36438679245283, "percentage": 36.82, "elapsed_time": "0:23:16", "remaining_time": "0:39:55", "throughput": 5830.62, "total_tokens": 8141408} {"current_steps": 12495, "total_steps": 33920, "loss": 0.4325, "lr": 7.962354475347593e-06, "epoch": 7.367334905660377, "percentage": 36.84, "elapsed_time": "0:23:16", "remaining_time": "0:39:55", "throughput": 5830.34, "total_tokens": 8143872} {"current_steps": 12500, "total_steps": 33920, "loss": 0.2763, "lr": 7.960281525756364e-06, "epoch": 7.370283018867925, "percentage": 36.85, "elapsed_time": "0:23:17", "remaining_time": "0:39:54", "throughput": 5830.79, "total_tokens": 8148096} {"current_steps": 12505, "total_steps": 33920, "loss": 0.5184, "lr": 7.95820779241784e-06, "epoch": 7.373231132075472, "percentage": 36.87, "elapsed_time": "0:23:17", "remaining_time": "0:39:53", "throughput": 5830.68, "total_tokens": 8150848} {"current_steps": 12510, "total_steps": 33920, "loss": 0.4826, "lr": 7.956133275881055e-06, "epoch": 7.376179245283019, "percentage": 36.88, "elapsed_time": "0:23:18", "remaining_time": "0:39:53", "throughput": 5831.18, "total_tokens": 8155232} {"current_steps": 12515, "total_steps": 33920, "loss": 0.4783, "lr": 7.954057976695244e-06, "epoch": 7.379127358490566, "percentage": 36.9, "elapsed_time": "0:23:19", "remaining_time": "0:39:53", "throughput": 5831.41, "total_tokens": 8158912} {"current_steps": 12520, "total_steps": 33920, "loss": 0.3174, "lr": 7.951981895409854e-06, "epoch": 7.382075471698113, "percentage": 36.91, "elapsed_time": "0:23:19", "remaining_time": "0:39:52", "throughput": 5831.29, "total_tokens": 8161696} {"current_steps": 12525, "total_steps": 33920, "loss": 0.4056, "lr": 7.949905032574534e-06, "epoch": 7.38502358490566, "percentage": 36.93, "elapsed_time": "0:23:20", "remaining_time": "0:39:51", "throughput": 5831.81, "total_tokens": 8166272} {"current_steps": 12530, "total_steps": 33920, "loss": 0.5553, "lr": 7.947827388739145e-06, "epoch": 7.3879716981132075, "percentage": 36.94, "elapsed_time": "0:23:20", "remaining_time": "0:39:51", "throughput": 5831.97, "total_tokens": 8169504} {"current_steps": 12535, "total_steps": 33920, "loss": 0.468, "lr": 7.945748964453747e-06, "epoch": 7.390919811320755, "percentage": 36.95, "elapsed_time": "0:23:21", "remaining_time": "0:39:50", "throughput": 5832.11, "total_tokens": 8172800} {"current_steps": 12540, "total_steps": 33920, "loss": 0.511, "lr": 7.943669760268618e-06, "epoch": 7.393867924528302, "percentage": 36.97, "elapsed_time": "0:23:21", "remaining_time": "0:39:50", "throughput": 5832.22, "total_tokens": 8176480} {"current_steps": 12545, "total_steps": 33920, "loss": 0.4246, "lr": 7.941589776734232e-06, "epoch": 7.396816037735849, "percentage": 36.98, "elapsed_time": "0:23:22", "remaining_time": "0:39:49", "throughput": 5832.37, "total_tokens": 8179616} {"current_steps": 12550, "total_steps": 33920, "loss": 0.3964, "lr": 7.939509014401277e-06, "epoch": 7.399764150943396, "percentage": 37.0, "elapsed_time": "0:23:23", "remaining_time": "0:39:49", "throughput": 5832.65, "total_tokens": 8183488} {"current_steps": 12555, "total_steps": 33920, "loss": 0.4537, "lr": 7.93742747382064e-06, "epoch": 7.402712264150943, "percentage": 37.01, "elapsed_time": "0:23:23", "remaining_time": "0:39:48", "throughput": 5832.56, "total_tokens": 8186592} {"current_steps": 12560, "total_steps": 33920, "loss": 0.3649, "lr": 7.93534515554342e-06, "epoch": 7.40566037735849, "percentage": 37.03, "elapsed_time": "0:23:24", "remaining_time": "0:39:47", "throughput": 5832.83, "total_tokens": 8190048} {"current_steps": 12565, "total_steps": 33920, "loss": 0.4374, "lr": 7.933262060120918e-06, "epoch": 7.408608490566038, "percentage": 37.04, "elapsed_time": "0:23:24", "remaining_time": "0:39:47", "throughput": 5832.99, "total_tokens": 8193440} {"current_steps": 12570, "total_steps": 33920, "loss": 0.4411, "lr": 7.931178188104646e-06, "epoch": 7.411556603773585, "percentage": 37.06, "elapsed_time": "0:23:25", "remaining_time": "0:39:46", "throughput": 5833.23, "total_tokens": 8196736} {"current_steps": 12575, "total_steps": 33920, "loss": 0.5102, "lr": 7.929093540046317e-06, "epoch": 7.414504716981132, "percentage": 37.07, "elapsed_time": "0:23:25", "remaining_time": "0:39:45", "throughput": 5833.15, "total_tokens": 8199456} {"current_steps": 12580, "total_steps": 33920, "loss": 0.6973, "lr": 7.927008116497848e-06, "epoch": 7.4174528301886795, "percentage": 37.09, "elapsed_time": "0:23:26", "remaining_time": "0:39:45", "throughput": 5833.52, "total_tokens": 8203360} {"current_steps": 12585, "total_steps": 33920, "loss": 0.4744, "lr": 7.924921918011366e-06, "epoch": 7.420400943396227, "percentage": 37.1, "elapsed_time": "0:23:26", "remaining_time": "0:39:44", "throughput": 5833.78, "total_tokens": 8207264} {"current_steps": 12590, "total_steps": 33920, "loss": 0.3945, "lr": 7.9228349451392e-06, "epoch": 7.423349056603773, "percentage": 37.12, "elapsed_time": "0:23:27", "remaining_time": "0:39:44", "throughput": 5833.83, "total_tokens": 8210528} {"current_steps": 12595, "total_steps": 33920, "loss": 0.3177, "lr": 7.920747198433884e-06, "epoch": 7.4262971698113205, "percentage": 37.13, "elapsed_time": "0:23:27", "remaining_time": "0:39:43", "throughput": 5833.71, "total_tokens": 8213728} {"current_steps": 12600, "total_steps": 33920, "loss": 0.4901, "lr": 7.91865867844816e-06, "epoch": 7.429245283018868, "percentage": 37.15, "elapsed_time": "0:23:28", "remaining_time": "0:39:43", "throughput": 5833.92, "total_tokens": 8217856} {"current_steps": 12605, "total_steps": 33920, "loss": 0.3317, "lr": 7.916569385734976e-06, "epoch": 7.432193396226415, "percentage": 37.16, "elapsed_time": "0:23:29", "remaining_time": "0:39:42", "throughput": 5833.48, "total_tokens": 8220000} {"current_steps": 12610, "total_steps": 33920, "loss": 0.3992, "lr": 7.914479320847474e-06, "epoch": 7.435141509433962, "percentage": 37.18, "elapsed_time": "0:23:29", "remaining_time": "0:39:42", "throughput": 5833.51, "total_tokens": 8223040} {"current_steps": 12615, "total_steps": 33920, "loss": 0.3922, "lr": 7.912388484339012e-06, "epoch": 7.43808962264151, "percentage": 37.19, "elapsed_time": "0:23:30", "remaining_time": "0:39:41", "throughput": 5833.21, "total_tokens": 8225344} {"current_steps": 12620, "total_steps": 33920, "loss": 0.4717, "lr": 7.910296876763147e-06, "epoch": 7.441037735849057, "percentage": 37.21, "elapsed_time": "0:23:30", "remaining_time": "0:39:40", "throughput": 5833.04, "total_tokens": 8227840} {"current_steps": 12625, "total_steps": 33920, "loss": 0.4376, "lr": 7.90820449867364e-06, "epoch": 7.443985849056604, "percentage": 37.22, "elapsed_time": "0:23:31", "remaining_time": "0:39:40", "throughput": 5833.28, "total_tokens": 8231232} {"current_steps": 12630, "total_steps": 33920, "loss": 0.414, "lr": 7.90611135062446e-06, "epoch": 7.446933962264151, "percentage": 37.23, "elapsed_time": "0:23:31", "remaining_time": "0:39:39", "throughput": 5833.32, "total_tokens": 8234400} {"current_steps": 12635, "total_steps": 33920, "loss": 0.4386, "lr": 7.904017433169775e-06, "epoch": 7.449882075471698, "percentage": 37.25, "elapsed_time": "0:23:32", "remaining_time": "0:39:38", "throughput": 5833.33, "total_tokens": 8237312} {"current_steps": 12640, "total_steps": 33920, "loss": 0.4274, "lr": 7.901922746863957e-06, "epoch": 7.452830188679245, "percentage": 37.26, "elapsed_time": "0:23:32", "remaining_time": "0:39:38", "throughput": 5833.56, "total_tokens": 8240864} {"current_steps": 12645, "total_steps": 33920, "loss": 0.4209, "lr": 7.899827292261589e-06, "epoch": 7.4557783018867925, "percentage": 37.28, "elapsed_time": "0:23:33", "remaining_time": "0:39:37", "throughput": 5833.78, "total_tokens": 8244256} {"current_steps": 12650, "total_steps": 33920, "loss": 0.3408, "lr": 7.897731069917444e-06, "epoch": 7.45872641509434, "percentage": 37.29, "elapsed_time": "0:23:33", "remaining_time": "0:39:37", "throughput": 5834.09, "total_tokens": 8248064} {"current_steps": 12655, "total_steps": 33920, "loss": 0.4101, "lr": 7.895634080386512e-06, "epoch": 7.461674528301887, "percentage": 37.31, "elapsed_time": "0:23:34", "remaining_time": "0:39:36", "throughput": 5834.23, "total_tokens": 8251648} {"current_steps": 12660, "total_steps": 33920, "loss": 0.4067, "lr": 7.893536324223977e-06, "epoch": 7.464622641509434, "percentage": 37.32, "elapsed_time": "0:23:34", "remaining_time": "0:39:36", "throughput": 5834.57, "total_tokens": 8255456} {"current_steps": 12665, "total_steps": 33920, "loss": 0.4408, "lr": 7.89143780198523e-06, "epoch": 7.467570754716981, "percentage": 37.34, "elapsed_time": "0:23:35", "remaining_time": "0:39:35", "throughput": 5834.53, "total_tokens": 8258208} {"current_steps": 12670, "total_steps": 33920, "loss": 0.3645, "lr": 7.889338514225862e-06, "epoch": 7.470518867924528, "percentage": 37.35, "elapsed_time": "0:23:35", "remaining_time": "0:39:34", "throughput": 5834.5, "total_tokens": 8260960} {"current_steps": 12675, "total_steps": 33920, "loss": 0.4477, "lr": 7.887238461501671e-06, "epoch": 7.473466981132075, "percentage": 37.37, "elapsed_time": "0:23:36", "remaining_time": "0:39:33", "throughput": 5834.25, "total_tokens": 8263360} {"current_steps": 12680, "total_steps": 33920, "loss": 0.294, "lr": 7.885137644368654e-06, "epoch": 7.476415094339623, "percentage": 37.38, "elapsed_time": "0:23:36", "remaining_time": "0:39:33", "throughput": 5834.21, "total_tokens": 8266016} {"current_steps": 12685, "total_steps": 33920, "loss": 0.4599, "lr": 7.883036063383012e-06, "epoch": 7.47936320754717, "percentage": 37.4, "elapsed_time": "0:23:37", "remaining_time": "0:39:32", "throughput": 5833.92, "total_tokens": 8268640} {"current_steps": 12690, "total_steps": 33920, "loss": 0.3729, "lr": 7.880933719101148e-06, "epoch": 7.482311320754717, "percentage": 37.41, "elapsed_time": "0:23:37", "remaining_time": "0:39:31", "throughput": 5833.86, "total_tokens": 8271456} {"current_steps": 12695, "total_steps": 33920, "loss": 0.381, "lr": 7.878830612079664e-06, "epoch": 7.4852594339622645, "percentage": 37.43, "elapsed_time": "0:23:38", "remaining_time": "0:39:31", "throughput": 5833.99, "total_tokens": 8274656} {"current_steps": 12700, "total_steps": 33920, "loss": 0.4714, "lr": 7.876726742875369e-06, "epoch": 7.488207547169811, "percentage": 37.44, "elapsed_time": "0:23:38", "remaining_time": "0:39:30", "throughput": 5833.89, "total_tokens": 8277472} {"current_steps": 12705, "total_steps": 33920, "loss": 0.4641, "lr": 7.874622112045269e-06, "epoch": 7.491155660377358, "percentage": 37.46, "elapsed_time": "0:23:39", "remaining_time": "0:39:30", "throughput": 5834.12, "total_tokens": 8280800} {"current_steps": 12710, "total_steps": 33920, "loss": 0.3916, "lr": 7.872516720146578e-06, "epoch": 7.494103773584905, "percentage": 37.47, "elapsed_time": "0:23:39", "remaining_time": "0:39:29", "throughput": 5834.1, "total_tokens": 8283712} {"current_steps": 12715, "total_steps": 33920, "loss": 0.37, "lr": 7.870410567736705e-06, "epoch": 7.497051886792453, "percentage": 37.49, "elapsed_time": "0:23:40", "remaining_time": "0:39:28", "throughput": 5834.45, "total_tokens": 8287872} {"current_steps": 12720, "total_steps": 33920, "loss": 0.3059, "lr": 7.868303655373264e-06, "epoch": 7.5, "percentage": 37.5, "elapsed_time": "0:23:41", "remaining_time": "0:39:28", "throughput": 5834.59, "total_tokens": 8291328} {"current_steps": 12725, "total_steps": 33920, "loss": 0.5107, "lr": 7.866195983614066e-06, "epoch": 7.502948113207547, "percentage": 37.51, "elapsed_time": "0:23:41", "remaining_time": "0:39:27", "throughput": 5834.52, "total_tokens": 8293920} {"current_steps": 12730, "total_steps": 33920, "loss": 0.5651, "lr": 7.864087553017133e-06, "epoch": 7.505896226415095, "percentage": 37.53, "elapsed_time": "0:23:42", "remaining_time": "0:39:27", "throughput": 5834.47, "total_tokens": 8296704} {"current_steps": 12735, "total_steps": 33920, "loss": 0.4373, "lr": 7.861978364140674e-06, "epoch": 7.508844339622642, "percentage": 37.54, "elapsed_time": "0:23:42", "remaining_time": "0:39:26", "throughput": 5834.9, "total_tokens": 8301792} {"current_steps": 12740, "total_steps": 33920, "loss": 0.4092, "lr": 7.859868417543109e-06, "epoch": 7.511792452830189, "percentage": 37.56, "elapsed_time": "0:23:43", "remaining_time": "0:39:26", "throughput": 5835.05, "total_tokens": 8305312} {"current_steps": 12745, "total_steps": 33920, "loss": 0.3922, "lr": 7.857757713783055e-06, "epoch": 7.5147405660377355, "percentage": 37.57, "elapsed_time": "0:23:43", "remaining_time": "0:39:25", "throughput": 5835.23, "total_tokens": 8308832} {"current_steps": 12750, "total_steps": 33920, "loss": 0.3832, "lr": 7.855646253419331e-06, "epoch": 7.517688679245283, "percentage": 37.59, "elapsed_time": "0:23:44", "remaining_time": "0:39:25", "throughput": 5835.01, "total_tokens": 8311200} {"current_steps": 12755, "total_steps": 33920, "loss": 0.4667, "lr": 7.853534037010952e-06, "epoch": 7.52063679245283, "percentage": 37.6, "elapsed_time": "0:23:44", "remaining_time": "0:39:24", "throughput": 5834.99, "total_tokens": 8313952} {"current_steps": 12760, "total_steps": 33920, "loss": 0.4567, "lr": 7.851421065117142e-06, "epoch": 7.523584905660377, "percentage": 37.62, "elapsed_time": "0:23:45", "remaining_time": "0:39:23", "throughput": 5835.06, "total_tokens": 8317024} {"current_steps": 12765, "total_steps": 33920, "loss": 0.382, "lr": 7.849307338297314e-06, "epoch": 7.526533018867925, "percentage": 37.63, "elapsed_time": "0:23:45", "remaining_time": "0:39:23", "throughput": 5834.61, "total_tokens": 8319648} {"current_steps": 12770, "total_steps": 33920, "loss": 0.3355, "lr": 7.847192857111087e-06, "epoch": 7.529481132075472, "percentage": 37.65, "elapsed_time": "0:23:46", "remaining_time": "0:39:22", "throughput": 5834.7, "total_tokens": 8322848} {"current_steps": 12775, "total_steps": 33920, "loss": 0.5652, "lr": 7.845077622118282e-06, "epoch": 7.532429245283019, "percentage": 37.66, "elapsed_time": "0:23:46", "remaining_time": "0:39:21", "throughput": 5834.72, "total_tokens": 8325664} {"current_steps": 12780, "total_steps": 33920, "loss": 0.544, "lr": 7.842961633878916e-06, "epoch": 7.535377358490566, "percentage": 37.68, "elapsed_time": "0:23:47", "remaining_time": "0:39:21", "throughput": 5835.19, "total_tokens": 8330144} {"current_steps": 12785, "total_steps": 33920, "loss": 0.4593, "lr": 7.840844892953204e-06, "epoch": 7.538325471698113, "percentage": 37.69, "elapsed_time": "0:23:48", "remaining_time": "0:39:20", "throughput": 5835.2, "total_tokens": 8333344} {"current_steps": 12790, "total_steps": 33920, "loss": 0.4677, "lr": 7.838727399901562e-06, "epoch": 7.54127358490566, "percentage": 37.71, "elapsed_time": "0:23:48", "remaining_time": "0:39:20", "throughput": 5835.68, "total_tokens": 8337920} {"current_steps": 12795, "total_steps": 33920, "loss": 0.399, "lr": 7.836609155284607e-06, "epoch": 7.5442216981132075, "percentage": 37.72, "elapsed_time": "0:23:49", "remaining_time": "0:39:19", "throughput": 5835.64, "total_tokens": 8340704} {"current_steps": 12800, "total_steps": 33920, "loss": 0.3755, "lr": 7.834490159663154e-06, "epoch": 7.547169811320755, "percentage": 37.74, "elapsed_time": "0:23:49", "remaining_time": "0:39:19", "throughput": 5835.7, "total_tokens": 8343872} {"current_steps": 12805, "total_steps": 33920, "loss": 0.3324, "lr": 7.832370413598215e-06, "epoch": 7.550117924528302, "percentage": 37.75, "elapsed_time": "0:23:50", "remaining_time": "0:39:18", "throughput": 5835.96, "total_tokens": 8347456} {"current_steps": 12810, "total_steps": 33920, "loss": 0.5419, "lr": 7.830249917651003e-06, "epoch": 7.553066037735849, "percentage": 37.77, "elapsed_time": "0:23:50", "remaining_time": "0:39:17", "throughput": 5836.03, "total_tokens": 8350688} {"current_steps": 12815, "total_steps": 33920, "loss": 0.4354, "lr": 7.828128672382926e-06, "epoch": 7.556014150943396, "percentage": 37.78, "elapsed_time": "0:23:51", "remaining_time": "0:39:17", "throughput": 5836.04, "total_tokens": 8353920} {"current_steps": 12820, "total_steps": 33920, "loss": 0.3481, "lr": 7.826006678355596e-06, "epoch": 7.558962264150943, "percentage": 37.79, "elapsed_time": "0:23:51", "remaining_time": "0:39:16", "throughput": 5836.01, "total_tokens": 8357024} {"current_steps": 12825, "total_steps": 33920, "loss": 0.3697, "lr": 7.823883936130817e-06, "epoch": 7.56191037735849, "percentage": 37.81, "elapsed_time": "0:23:52", "remaining_time": "0:39:16", "throughput": 5836.08, "total_tokens": 8360160} {"current_steps": 12830, "total_steps": 33920, "loss": 0.3563, "lr": 7.821760446270597e-06, "epoch": 7.564858490566038, "percentage": 37.82, "elapsed_time": "0:23:53", "remaining_time": "0:39:15", "throughput": 5835.98, "total_tokens": 8362976} {"current_steps": 12835, "total_steps": 33920, "loss": 0.3888, "lr": 7.819636209337136e-06, "epoch": 7.567806603773585, "percentage": 37.84, "elapsed_time": "0:23:53", "remaining_time": "0:39:14", "throughput": 5835.97, "total_tokens": 8365888} {"current_steps": 12840, "total_steps": 33920, "loss": 0.4236, "lr": 7.817511225892838e-06, "epoch": 7.570754716981132, "percentage": 37.85, "elapsed_time": "0:23:54", "remaining_time": "0:39:14", "throughput": 5836.06, "total_tokens": 8369120} {"current_steps": 12845, "total_steps": 33920, "loss": 0.4603, "lr": 7.8153854965003e-06, "epoch": 7.5737028301886795, "percentage": 37.87, "elapsed_time": "0:23:54", "remaining_time": "0:39:13", "throughput": 5836.48, "total_tokens": 8373376} {"current_steps": 12850, "total_steps": 33920, "loss": 0.3501, "lr": 7.813259021722319e-06, "epoch": 7.576650943396227, "percentage": 37.88, "elapsed_time": "0:23:55", "remaining_time": "0:39:13", "throughput": 5835.95, "total_tokens": 8375808} {"current_steps": 12855, "total_steps": 33920, "loss": 0.5657, "lr": 7.811131802121885e-06, "epoch": 7.579599056603773, "percentage": 37.9, "elapsed_time": "0:23:55", "remaining_time": "0:39:12", "throughput": 5835.96, "total_tokens": 8378720} {"current_steps": 12860, "total_steps": 33920, "loss": 0.3197, "lr": 7.809003838262193e-06, "epoch": 7.5825471698113205, "percentage": 37.91, "elapsed_time": "0:23:56", "remaining_time": "0:39:11", "throughput": 5836.08, "total_tokens": 8381728} {"current_steps": 12865, "total_steps": 33920, "loss": 0.4422, "lr": 7.806875130706628e-06, "epoch": 7.585495283018868, "percentage": 37.93, "elapsed_time": "0:23:56", "remaining_time": "0:39:11", "throughput": 5835.95, "total_tokens": 8384480} {"current_steps": 12870, "total_steps": 33920, "loss": 0.3221, "lr": 7.804745680018775e-06, "epoch": 7.588443396226415, "percentage": 37.94, "elapsed_time": "0:23:57", "remaining_time": "0:39:10", "throughput": 5835.8, "total_tokens": 8387104} {"current_steps": 12875, "total_steps": 33920, "loss": 0.3857, "lr": 7.802615486762418e-06, "epoch": 7.591391509433962, "percentage": 37.96, "elapsed_time": "0:23:57", "remaining_time": "0:39:10", "throughput": 5836.03, "total_tokens": 8390560} {"current_steps": 12880, "total_steps": 33920, "loss": 0.4363, "lr": 7.800484551501528e-06, "epoch": 7.59433962264151, "percentage": 37.97, "elapsed_time": "0:23:58", "remaining_time": "0:39:09", "throughput": 5835.98, "total_tokens": 8393472} {"current_steps": 12885, "total_steps": 33920, "loss": 0.4374, "lr": 7.798352874800285e-06, "epoch": 7.597287735849057, "percentage": 37.99, "elapsed_time": "0:23:58", "remaining_time": "0:39:08", "throughput": 5835.93, "total_tokens": 8396416} {"current_steps": 12890, "total_steps": 33920, "loss": 0.3626, "lr": 7.79622045722306e-06, "epoch": 7.600235849056604, "percentage": 38.0, "elapsed_time": "0:23:59", "remaining_time": "0:39:08", "throughput": 5836.21, "total_tokens": 8400096} {"current_steps": 12895, "total_steps": 33920, "loss": 0.3912, "lr": 7.794087299334416e-06, "epoch": 7.603183962264151, "percentage": 38.02, "elapsed_time": "0:23:59", "remaining_time": "0:39:07", "throughput": 5836.26, "total_tokens": 8403552} {"current_steps": 12900, "total_steps": 33920, "loss": 0.4015, "lr": 7.79195340169912e-06, "epoch": 7.606132075471698, "percentage": 38.03, "elapsed_time": "0:24:00", "remaining_time": "0:39:07", "throughput": 5836.52, "total_tokens": 8407648} {"current_steps": 12905, "total_steps": 33920, "loss": 0.471, "lr": 7.789818764882127e-06, "epoch": 7.609080188679245, "percentage": 38.05, "elapsed_time": "0:24:01", "remaining_time": "0:39:06", "throughput": 5836.59, "total_tokens": 8410720} {"current_steps": 12910, "total_steps": 33920, "loss": 0.31, "lr": 7.78768338944859e-06, "epoch": 7.6120283018867925, "percentage": 38.06, "elapsed_time": "0:24:01", "remaining_time": "0:39:05", "throughput": 5836.49, "total_tokens": 8413408} {"current_steps": 12915, "total_steps": 33920, "loss": 0.3788, "lr": 7.785547275963865e-06, "epoch": 7.61497641509434, "percentage": 38.07, "elapsed_time": "0:24:02", "remaining_time": "0:39:05", "throughput": 5836.53, "total_tokens": 8416768} {"current_steps": 12920, "total_steps": 33920, "loss": 0.3913, "lr": 7.783410424993492e-06, "epoch": 7.617924528301887, "percentage": 38.09, "elapsed_time": "0:24:02", "remaining_time": "0:39:04", "throughput": 5836.23, "total_tokens": 8419072} {"current_steps": 12925, "total_steps": 33920, "loss": 0.4123, "lr": 7.781272837103213e-06, "epoch": 7.620872641509434, "percentage": 38.1, "elapsed_time": "0:24:03", "remaining_time": "0:39:04", "throughput": 5836.18, "total_tokens": 8421728} {"current_steps": 12930, "total_steps": 33920, "loss": 0.3753, "lr": 7.779134512858964e-06, "epoch": 7.623820754716981, "percentage": 38.12, "elapsed_time": "0:24:03", "remaining_time": "0:39:03", "throughput": 5836.2, "total_tokens": 8425184} {"current_steps": 12935, "total_steps": 33920, "loss": 0.4383, "lr": 7.776995452826876e-06, "epoch": 7.626768867924528, "percentage": 38.13, "elapsed_time": "0:24:04", "remaining_time": "0:39:02", "throughput": 5836.2, "total_tokens": 8428256} {"current_steps": 12940, "total_steps": 33920, "loss": 0.4513, "lr": 7.774855657573274e-06, "epoch": 7.629716981132075, "percentage": 38.15, "elapsed_time": "0:24:04", "remaining_time": "0:39:02", "throughput": 5836.44, "total_tokens": 8431872} {"current_steps": 12945, "total_steps": 33920, "loss": 0.3603, "lr": 7.772715127664676e-06, "epoch": 7.632665094339623, "percentage": 38.16, "elapsed_time": "0:24:05", "remaining_time": "0:39:01", "throughput": 5836.4, "total_tokens": 8434656} {"current_steps": 12950, "total_steps": 33920, "loss": 0.3734, "lr": 7.7705738636678e-06, "epoch": 7.63561320754717, "percentage": 38.18, "elapsed_time": "0:24:05", "remaining_time": "0:39:01", "throughput": 5836.34, "total_tokens": 8437504} {"current_steps": 12955, "total_steps": 33920, "loss": 0.3585, "lr": 7.768431866149552e-06, "epoch": 7.638561320754717, "percentage": 38.19, "elapsed_time": "0:24:06", "remaining_time": "0:39:00", "throughput": 5836.57, "total_tokens": 8440960} {"current_steps": 12960, "total_steps": 33920, "loss": 0.4011, "lr": 7.766289135677035e-06, "epoch": 7.6415094339622645, "percentage": 38.21, "elapsed_time": "0:24:06", "remaining_time": "0:38:59", "throughput": 5836.6, "total_tokens": 8444128} {"current_steps": 12965, "total_steps": 33920, "loss": 0.498, "lr": 7.764145672817549e-06, "epoch": 7.644457547169811, "percentage": 38.22, "elapsed_time": "0:24:07", "remaining_time": "0:38:59", "throughput": 5837.0, "total_tokens": 8448192} {"current_steps": 12970, "total_steps": 33920, "loss": 0.4189, "lr": 7.762001478138583e-06, "epoch": 7.647405660377358, "percentage": 38.24, "elapsed_time": "0:24:07", "remaining_time": "0:38:58", "throughput": 5837.26, "total_tokens": 8451744} {"current_steps": 12975, "total_steps": 33920, "loss": 0.4304, "lr": 7.759856552207822e-06, "epoch": 7.650353773584905, "percentage": 38.25, "elapsed_time": "0:24:08", "remaining_time": "0:38:58", "throughput": 5837.29, "total_tokens": 8455040} {"current_steps": 12980, "total_steps": 33920, "loss": 0.3564, "lr": 7.757710895593144e-06, "epoch": 7.653301886792453, "percentage": 38.27, "elapsed_time": "0:24:08", "remaining_time": "0:38:57", "throughput": 5837.08, "total_tokens": 8457792} {"current_steps": 12985, "total_steps": 33920, "loss": 0.4801, "lr": 7.755564508862623e-06, "epoch": 7.65625, "percentage": 38.28, "elapsed_time": "0:24:09", "remaining_time": "0:38:57", "throughput": 5837.32, "total_tokens": 8461440} {"current_steps": 12990, "total_steps": 33920, "loss": 0.527, "lr": 7.753417392584522e-06, "epoch": 7.659198113207547, "percentage": 38.3, "elapsed_time": "0:24:10", "remaining_time": "0:38:56", "throughput": 5837.38, "total_tokens": 8464576} {"current_steps": 12995, "total_steps": 33920, "loss": 0.301, "lr": 7.751269547327298e-06, "epoch": 7.662146226415095, "percentage": 38.31, "elapsed_time": "0:24:10", "remaining_time": "0:38:55", "throughput": 5837.54, "total_tokens": 8468160} {"current_steps": 13000, "total_steps": 33920, "loss": 0.3607, "lr": 7.749120973659606e-06, "epoch": 7.665094339622642, "percentage": 38.33, "elapsed_time": "0:24:11", "remaining_time": "0:38:55", "throughput": 5837.6, "total_tokens": 8471296} {"current_steps": 13005, "total_steps": 33920, "loss": 0.3674, "lr": 7.746971672150286e-06, "epoch": 7.668042452830189, "percentage": 38.34, "elapsed_time": "0:24:11", "remaining_time": "0:38:54", "throughput": 5837.4, "total_tokens": 8473728} {"current_steps": 13010, "total_steps": 33920, "loss": 0.5391, "lr": 7.74482164336838e-06, "epoch": 7.6709905660377355, "percentage": 38.35, "elapsed_time": "0:24:12", "remaining_time": "0:38:54", "throughput": 5837.74, "total_tokens": 8477600} {"current_steps": 13015, "total_steps": 33920, "loss": 0.5365, "lr": 7.742670887883111e-06, "epoch": 7.673938679245283, "percentage": 38.37, "elapsed_time": "0:24:12", "remaining_time": "0:38:53", "throughput": 5837.86, "total_tokens": 8480704} {"current_steps": 13020, "total_steps": 33920, "loss": 0.3469, "lr": 7.740519406263905e-06, "epoch": 7.67688679245283, "percentage": 38.38, "elapsed_time": "0:24:13", "remaining_time": "0:38:52", "throughput": 5837.82, "total_tokens": 8483872} {"current_steps": 13025, "total_steps": 33920, "loss": 0.2866, "lr": 7.738367199080376e-06, "epoch": 7.679834905660377, "percentage": 38.4, "elapsed_time": "0:24:13", "remaining_time": "0:38:52", "throughput": 5837.93, "total_tokens": 8486848} {"current_steps": 13030, "total_steps": 33920, "loss": 0.57, "lr": 7.73621426690233e-06, "epoch": 7.682783018867925, "percentage": 38.41, "elapsed_time": "0:24:14", "remaining_time": "0:38:51", "throughput": 5837.92, "total_tokens": 8489536} {"current_steps": 13035, "total_steps": 33920, "loss": 0.4558, "lr": 7.734060610299764e-06, "epoch": 7.685731132075472, "percentage": 38.43, "elapsed_time": "0:24:14", "remaining_time": "0:38:50", "throughput": 5837.81, "total_tokens": 8492320} {"current_steps": 13040, "total_steps": 33920, "loss": 0.5196, "lr": 7.731906229842869e-06, "epoch": 7.688679245283019, "percentage": 38.44, "elapsed_time": "0:24:15", "remaining_time": "0:38:50", "throughput": 5837.89, "total_tokens": 8495328} {"current_steps": 13045, "total_steps": 33920, "loss": 0.4421, "lr": 7.729751126102023e-06, "epoch": 7.691627358490566, "percentage": 38.46, "elapsed_time": "0:24:15", "remaining_time": "0:38:49", "throughput": 5838.05, "total_tokens": 8498368} {"current_steps": 13050, "total_steps": 33920, "loss": 0.3836, "lr": 7.727595299647805e-06, "epoch": 7.694575471698113, "percentage": 38.47, "elapsed_time": "0:24:16", "remaining_time": "0:38:48", "throughput": 5838.21, "total_tokens": 8501632} {"current_steps": 13055, "total_steps": 33920, "loss": 0.3607, "lr": 7.725438751050973e-06, "epoch": 7.69752358490566, "percentage": 38.49, "elapsed_time": "0:24:16", "remaining_time": "0:38:48", "throughput": 5838.3, "total_tokens": 8504800} {"current_steps": 13060, "total_steps": 33920, "loss": 0.5088, "lr": 7.723281480882489e-06, "epoch": 7.7004716981132075, "percentage": 38.5, "elapsed_time": "0:24:17", "remaining_time": "0:38:47", "throughput": 5838.08, "total_tokens": 8507264} {"current_steps": 13065, "total_steps": 33920, "loss": 0.3502, "lr": 7.721123489713494e-06, "epoch": 7.703419811320755, "percentage": 38.52, "elapsed_time": "0:24:17", "remaining_time": "0:38:47", "throughput": 5838.26, "total_tokens": 8511040} {"current_steps": 13070, "total_steps": 33920, "loss": 0.394, "lr": 7.718964778115328e-06, "epoch": 7.706367924528302, "percentage": 38.53, "elapsed_time": "0:24:18", "remaining_time": "0:38:46", "throughput": 5838.21, "total_tokens": 8513952} {"current_steps": 13075, "total_steps": 33920, "loss": 0.4228, "lr": 7.716805346659519e-06, "epoch": 7.709316037735849, "percentage": 38.55, "elapsed_time": "0:24:18", "remaining_time": "0:38:45", "throughput": 5838.41, "total_tokens": 8517344} {"current_steps": 13080, "total_steps": 33920, "loss": 0.4467, "lr": 7.714645195917788e-06, "epoch": 7.712264150943396, "percentage": 38.56, "elapsed_time": "0:24:19", "remaining_time": "0:38:45", "throughput": 5838.36, "total_tokens": 8520448} {"current_steps": 13085, "total_steps": 33920, "loss": 0.4963, "lr": 7.712484326462038e-06, "epoch": 7.715212264150943, "percentage": 38.58, "elapsed_time": "0:24:19", "remaining_time": "0:38:44", "throughput": 5838.33, "total_tokens": 8523328} {"current_steps": 13090, "total_steps": 33920, "loss": 0.3976, "lr": 7.710322738864375e-06, "epoch": 7.71816037735849, "percentage": 38.59, "elapsed_time": "0:24:20", "remaining_time": "0:38:43", "throughput": 5838.51, "total_tokens": 8526816} {"current_steps": 13095, "total_steps": 33920, "loss": 0.4499, "lr": 7.708160433697085e-06, "epoch": 7.721108490566038, "percentage": 38.61, "elapsed_time": "0:24:20", "remaining_time": "0:38:43", "throughput": 5838.39, "total_tokens": 8529504} {"current_steps": 13100, "total_steps": 33920, "loss": 0.3348, "lr": 7.705997411532649e-06, "epoch": 7.724056603773585, "percentage": 38.62, "elapsed_time": "0:24:21", "remaining_time": "0:38:42", "throughput": 5838.5, "total_tokens": 8533056} {"current_steps": 13105, "total_steps": 33920, "loss": 0.4559, "lr": 7.703833672943735e-06, "epoch": 7.727004716981132, "percentage": 38.64, "elapsed_time": "0:24:22", "remaining_time": "0:38:42", "throughput": 5838.58, "total_tokens": 8536288} {"current_steps": 13110, "total_steps": 33920, "loss": 0.4687, "lr": 7.701669218503206e-06, "epoch": 7.7299528301886795, "percentage": 38.65, "elapsed_time": "0:24:22", "remaining_time": "0:38:41", "throughput": 5838.37, "total_tokens": 8538880} {"current_steps": 13115, "total_steps": 33920, "loss": 0.402, "lr": 7.699504048784106e-06, "epoch": 7.732900943396227, "percentage": 38.66, "elapsed_time": "0:24:23", "remaining_time": "0:38:41", "throughput": 5838.73, "total_tokens": 8544736} {"current_steps": 13120, "total_steps": 33920, "loss": 0.4157, "lr": 7.697338164359675e-06, "epoch": 7.735849056603773, "percentage": 38.68, "elapsed_time": "0:24:23", "remaining_time": "0:38:40", "throughput": 5838.55, "total_tokens": 8547136} {"current_steps": 13125, "total_steps": 33920, "loss": 0.3464, "lr": 7.69517156580334e-06, "epoch": 7.7387971698113205, "percentage": 38.69, "elapsed_time": "0:24:24", "remaining_time": "0:38:40", "throughput": 5838.44, "total_tokens": 8549984} {"current_steps": 13130, "total_steps": 33920, "loss": 0.4093, "lr": 7.693004253688716e-06, "epoch": 7.741745283018868, "percentage": 38.71, "elapsed_time": "0:24:25", "remaining_time": "0:38:39", "throughput": 5838.67, "total_tokens": 8553792} {"current_steps": 13135, "total_steps": 33920, "loss": 0.3818, "lr": 7.690836228589613e-06, "epoch": 7.744693396226415, "percentage": 38.72, "elapsed_time": "0:24:25", "remaining_time": "0:38:39", "throughput": 5838.65, "total_tokens": 8556480} {"current_steps": 13140, "total_steps": 33920, "loss": 0.4145, "lr": 7.688667491080019e-06, "epoch": 7.747641509433962, "percentage": 38.74, "elapsed_time": "0:24:26", "remaining_time": "0:38:38", "throughput": 5838.68, "total_tokens": 8559616} {"current_steps": 13145, "total_steps": 33920, "loss": 0.4131, "lr": 7.686498041734121e-06, "epoch": 7.75058962264151, "percentage": 38.75, "elapsed_time": "0:24:26", "remaining_time": "0:38:37", "throughput": 5838.55, "total_tokens": 8562400} {"current_steps": 13150, "total_steps": 33920, "loss": 0.4227, "lr": 7.684327881126285e-06, "epoch": 7.753537735849057, "percentage": 38.77, "elapsed_time": "0:24:27", "remaining_time": "0:38:37", "throughput": 5838.85, "total_tokens": 8566336} {"current_steps": 13155, "total_steps": 33920, "loss": 0.4486, "lr": 7.682157009831078e-06, "epoch": 7.756485849056604, "percentage": 38.78, "elapsed_time": "0:24:27", "remaining_time": "0:38:36", "throughput": 5839.22, "total_tokens": 8570976} {"current_steps": 13160, "total_steps": 33920, "loss": 0.4101, "lr": 7.67998542842324e-06, "epoch": 7.759433962264151, "percentage": 38.8, "elapsed_time": "0:24:28", "remaining_time": "0:38:36", "throughput": 5839.35, "total_tokens": 8574176} {"current_steps": 13165, "total_steps": 33920, "loss": 0.4454, "lr": 7.677813137477711e-06, "epoch": 7.762382075471698, "percentage": 38.81, "elapsed_time": "0:24:28", "remaining_time": "0:38:35", "throughput": 5839.24, "total_tokens": 8577120} {"current_steps": 13170, "total_steps": 33920, "loss": 0.441, "lr": 7.675640137569614e-06, "epoch": 7.765330188679245, "percentage": 38.83, "elapsed_time": "0:24:29", "remaining_time": "0:38:35", "throughput": 5839.08, "total_tokens": 8579936} {"current_steps": 13175, "total_steps": 33920, "loss": 0.5256, "lr": 7.673466429274257e-06, "epoch": 7.7682783018867925, "percentage": 38.84, "elapsed_time": "0:24:29", "remaining_time": "0:38:34", "throughput": 5838.8, "total_tokens": 8582304} {"current_steps": 13180, "total_steps": 33920, "loss": 0.3135, "lr": 7.671292013167143e-06, "epoch": 7.77122641509434, "percentage": 38.86, "elapsed_time": "0:24:30", "remaining_time": "0:38:33", "throughput": 5838.9, "total_tokens": 8585184} {"current_steps": 13185, "total_steps": 33920, "loss": 0.4471, "lr": 7.669116889823955e-06, "epoch": 7.774174528301887, "percentage": 38.87, "elapsed_time": "0:24:30", "remaining_time": "0:38:33", "throughput": 5838.9, "total_tokens": 8588128} {"current_steps": 13190, "total_steps": 33920, "loss": 0.3611, "lr": 7.666941059820567e-06, "epoch": 7.777122641509434, "percentage": 38.89, "elapsed_time": "0:24:31", "remaining_time": "0:38:32", "throughput": 5839.0, "total_tokens": 8591808} {"current_steps": 13195, "total_steps": 33920, "loss": 0.4664, "lr": 7.66476452373304e-06, "epoch": 7.780070754716981, "percentage": 38.9, "elapsed_time": "0:24:31", "remaining_time": "0:38:31", "throughput": 5839.08, "total_tokens": 8594752} {"current_steps": 13200, "total_steps": 33920, "loss": 0.3859, "lr": 7.66258728213762e-06, "epoch": 7.783018867924528, "percentage": 38.92, "elapsed_time": "0:24:32", "remaining_time": "0:38:31", "throughput": 5839.27, "total_tokens": 8598304} {"current_steps": 13205, "total_steps": 33920, "loss": 0.3913, "lr": 7.66040933561074e-06, "epoch": 7.785966981132075, "percentage": 38.93, "elapsed_time": "0:24:32", "remaining_time": "0:38:30", "throughput": 5839.13, "total_tokens": 8600992} {"current_steps": 13210, "total_steps": 33920, "loss": 0.4422, "lr": 7.658230684729027e-06, "epoch": 7.788915094339623, "percentage": 38.94, "elapsed_time": "0:24:34", "remaining_time": "0:38:30", "throughput": 5839.69, "total_tokens": 8608192} {"current_steps": 13215, "total_steps": 33920, "loss": 0.3475, "lr": 7.656051330069282e-06, "epoch": 7.79186320754717, "percentage": 38.96, "elapsed_time": "0:24:34", "remaining_time": "0:38:30", "throughput": 5840.02, "total_tokens": 8612576} {"current_steps": 13220, "total_steps": 33920, "loss": 0.4225, "lr": 7.6538712722085e-06, "epoch": 7.794811320754717, "percentage": 38.97, "elapsed_time": "0:24:35", "remaining_time": "0:38:29", "throughput": 5840.15, "total_tokens": 8615680} {"current_steps": 13225, "total_steps": 33920, "loss": 0.3988, "lr": 7.651690511723862e-06, "epoch": 7.7977594339622645, "percentage": 38.99, "elapsed_time": "0:24:35", "remaining_time": "0:38:29", "throughput": 5839.82, "total_tokens": 8618080} {"current_steps": 13230, "total_steps": 33920, "loss": 0.2902, "lr": 7.64950904919273e-06, "epoch": 7.800707547169811, "percentage": 39.0, "elapsed_time": "0:24:36", "remaining_time": "0:38:28", "throughput": 5839.75, "total_tokens": 8620608} {"current_steps": 13235, "total_steps": 33920, "loss": 0.5519, "lr": 7.647326885192662e-06, "epoch": 7.803655660377358, "percentage": 39.02, "elapsed_time": "0:24:36", "remaining_time": "0:38:27", "throughput": 5839.72, "total_tokens": 8623424} {"current_steps": 13240, "total_steps": 33920, "loss": 0.5043, "lr": 7.645144020301392e-06, "epoch": 7.806603773584905, "percentage": 39.03, "elapsed_time": "0:24:37", "remaining_time": "0:38:27", "throughput": 5840.08, "total_tokens": 8627360} {"current_steps": 13245, "total_steps": 33920, "loss": 0.4525, "lr": 7.64296045509684e-06, "epoch": 7.809551886792453, "percentage": 39.05, "elapsed_time": "0:24:37", "remaining_time": "0:38:26", "throughput": 5839.91, "total_tokens": 8629888} {"current_steps": 13250, "total_steps": 33920, "loss": 0.5715, "lr": 7.64077619015712e-06, "epoch": 7.8125, "percentage": 39.06, "elapsed_time": "0:24:38", "remaining_time": "0:38:26", "throughput": 5840.13, "total_tokens": 8633408} {"current_steps": 13255, "total_steps": 33920, "loss": 0.4835, "lr": 7.638591226060519e-06, "epoch": 7.815448113207547, "percentage": 39.08, "elapsed_time": "0:24:38", "remaining_time": "0:38:25", "throughput": 5840.26, "total_tokens": 8636512} {"current_steps": 13260, "total_steps": 33920, "loss": 0.4835, "lr": 7.636405563385522e-06, "epoch": 7.818396226415095, "percentage": 39.09, "elapsed_time": "0:24:39", "remaining_time": "0:38:24", "throughput": 5840.47, "total_tokens": 8640320} {"current_steps": 13265, "total_steps": 33920, "loss": 0.5227, "lr": 7.634219202710789e-06, "epoch": 7.821344339622642, "percentage": 39.11, "elapsed_time": "0:24:39", "remaining_time": "0:38:24", "throughput": 5840.67, "total_tokens": 8643872} {"current_steps": 13270, "total_steps": 33920, "loss": 0.2569, "lr": 7.632032144615168e-06, "epoch": 7.824292452830189, "percentage": 39.12, "elapsed_time": "0:24:40", "remaining_time": "0:38:23", "throughput": 5840.68, "total_tokens": 8646880} {"current_steps": 13275, "total_steps": 33920, "loss": 0.4049, "lr": 7.629844389677695e-06, "epoch": 7.8272405660377355, "percentage": 39.14, "elapsed_time": "0:24:40", "remaining_time": "0:38:23", "throughput": 5840.68, "total_tokens": 8649568} {"current_steps": 13280, "total_steps": 33920, "loss": 0.3216, "lr": 7.627655938477586e-06, "epoch": 7.830188679245283, "percentage": 39.15, "elapsed_time": "0:24:41", "remaining_time": "0:38:22", "throughput": 5840.8, "total_tokens": 8652672} {"current_steps": 13285, "total_steps": 33920, "loss": 0.3919, "lr": 7.6254667915942415e-06, "epoch": 7.83313679245283, "percentage": 39.17, "elapsed_time": "0:24:41", "remaining_time": "0:38:21", "throughput": 5840.93, "total_tokens": 8656192} {"current_steps": 13290, "total_steps": 33920, "loss": 0.455, "lr": 7.62327694960725e-06, "epoch": 7.836084905660377, "percentage": 39.18, "elapsed_time": "0:24:42", "remaining_time": "0:38:21", "throughput": 5841.13, "total_tokens": 8659776} {"current_steps": 13295, "total_steps": 33920, "loss": 0.4131, "lr": 7.621086413096379e-06, "epoch": 7.839033018867925, "percentage": 39.2, "elapsed_time": "0:24:43", "remaining_time": "0:38:20", "throughput": 5841.08, "total_tokens": 8662688} {"current_steps": 13300, "total_steps": 33920, "loss": 0.3886, "lr": 7.618895182641584e-06, "epoch": 7.841981132075472, "percentage": 39.21, "elapsed_time": "0:24:43", "remaining_time": "0:38:20", "throughput": 5841.1, "total_tokens": 8665760} {"current_steps": 13305, "total_steps": 33920, "loss": 0.5656, "lr": 7.6167032588230035e-06, "epoch": 7.844929245283019, "percentage": 39.22, "elapsed_time": "0:24:44", "remaining_time": "0:38:19", "throughput": 5841.28, "total_tokens": 8669280} {"current_steps": 13310, "total_steps": 33920, "loss": 0.3872, "lr": 7.614510642220958e-06, "epoch": 7.847877358490566, "percentage": 39.24, "elapsed_time": "0:24:44", "remaining_time": "0:38:19", "throughput": 5841.57, "total_tokens": 8673184} {"current_steps": 13315, "total_steps": 33920, "loss": 0.3348, "lr": 7.612317333415951e-06, "epoch": 7.850825471698113, "percentage": 39.25, "elapsed_time": "0:24:45", "remaining_time": "0:38:18", "throughput": 5841.7, "total_tokens": 8676640} {"current_steps": 13320, "total_steps": 33920, "loss": 0.5106, "lr": 7.610123332988673e-06, "epoch": 7.85377358490566, "percentage": 39.27, "elapsed_time": "0:24:45", "remaining_time": "0:38:17", "throughput": 5841.75, "total_tokens": 8679744} {"current_steps": 13325, "total_steps": 33920, "loss": 0.3815, "lr": 7.607928641519992e-06, "epoch": 7.8567216981132075, "percentage": 39.28, "elapsed_time": "0:24:46", "remaining_time": "0:38:17", "throughput": 5841.82, "total_tokens": 8682752} {"current_steps": 13330, "total_steps": 33920, "loss": 0.4225, "lr": 7.605733259590964e-06, "epoch": 7.859669811320755, "percentage": 39.3, "elapsed_time": "0:24:46", "remaining_time": "0:38:16", "throughput": 5841.76, "total_tokens": 8685472} {"current_steps": 13335, "total_steps": 33920, "loss": 0.3393, "lr": 7.603537187782826e-06, "epoch": 7.862617924528302, "percentage": 39.31, "elapsed_time": "0:24:47", "remaining_time": "0:38:16", "throughput": 5842.13, "total_tokens": 8689632} {"current_steps": 13340, "total_steps": 33920, "loss": 0.4447, "lr": 7.601340426676996e-06, "epoch": 7.865566037735849, "percentage": 39.33, "elapsed_time": "0:24:47", "remaining_time": "0:38:15", "throughput": 5842.4, "total_tokens": 8693440} {"current_steps": 13345, "total_steps": 33920, "loss": 0.3355, "lr": 7.599142976855077e-06, "epoch": 7.868514150943396, "percentage": 39.34, "elapsed_time": "0:24:48", "remaining_time": "0:38:14", "throughput": 5842.63, "total_tokens": 8696960} {"current_steps": 13350, "total_steps": 33920, "loss": 0.3982, "lr": 7.596944838898854e-06, "epoch": 7.871462264150943, "percentage": 39.36, "elapsed_time": "0:24:49", "remaining_time": "0:38:14", "throughput": 5842.89, "total_tokens": 8700864} {"current_steps": 13355, "total_steps": 33920, "loss": 0.432, "lr": 7.594746013390293e-06, "epoch": 7.87441037735849, "percentage": 39.37, "elapsed_time": "0:24:49", "remaining_time": "0:38:13", "throughput": 5842.89, "total_tokens": 8703904} {"current_steps": 13360, "total_steps": 33920, "loss": 0.4019, "lr": 7.59254650091154e-06, "epoch": 7.877358490566038, "percentage": 39.39, "elapsed_time": "0:24:50", "remaining_time": "0:38:13", "throughput": 5842.94, "total_tokens": 8707552} {"current_steps": 13365, "total_steps": 33920, "loss": 0.3984, "lr": 7.59034630204493e-06, "epoch": 7.880306603773585, "percentage": 39.4, "elapsed_time": "0:24:50", "remaining_time": "0:38:12", "throughput": 5843.01, "total_tokens": 8710464} {"current_steps": 13370, "total_steps": 33920, "loss": 0.3975, "lr": 7.588145417372972e-06, "epoch": 7.883254716981132, "percentage": 39.42, "elapsed_time": "0:24:51", "remaining_time": "0:38:12", "throughput": 5842.95, "total_tokens": 8713216} {"current_steps": 13375, "total_steps": 33920, "loss": 0.4141, "lr": 7.585943847478361e-06, "epoch": 7.8862028301886795, "percentage": 39.43, "elapsed_time": "0:24:51", "remaining_time": "0:38:11", "throughput": 5843.05, "total_tokens": 8716512} {"current_steps": 13380, "total_steps": 33920, "loss": 0.3418, "lr": 7.583741592943971e-06, "epoch": 7.889150943396227, "percentage": 39.45, "elapsed_time": "0:24:52", "remaining_time": "0:38:10", "throughput": 5843.2, "total_tokens": 8719840} {"current_steps": 13385, "total_steps": 33920, "loss": 0.3369, "lr": 7.581538654352859e-06, "epoch": 7.892099056603773, "percentage": 39.46, "elapsed_time": "0:24:52", "remaining_time": "0:38:10", "throughput": 5843.46, "total_tokens": 8723296} {"current_steps": 13390, "total_steps": 33920, "loss": 0.4314, "lr": 7.579335032288262e-06, "epoch": 7.8950471698113205, "percentage": 39.48, "elapsed_time": "0:24:53", "remaining_time": "0:38:09", "throughput": 5843.61, "total_tokens": 8726272} {"current_steps": 13395, "total_steps": 33920, "loss": 0.3827, "lr": 7.577130727333598e-06, "epoch": 7.897995283018868, "percentage": 39.49, "elapsed_time": "0:24:53", "remaining_time": "0:38:08", "throughput": 5843.68, "total_tokens": 8729216} {"current_steps": 13400, "total_steps": 33920, "loss": 0.4882, "lr": 7.5749257400724695e-06, "epoch": 7.900943396226415, "percentage": 39.5, "elapsed_time": "0:24:54", "remaining_time": "0:38:08", "throughput": 5843.46, "total_tokens": 8731648} {"current_steps": 13405, "total_steps": 33920, "loss": 0.4285, "lr": 7.572720071088653e-06, "epoch": 7.903891509433962, "percentage": 39.52, "elapsed_time": "0:24:54", "remaining_time": "0:38:07", "throughput": 5843.55, "total_tokens": 8735104} {"current_steps": 13410, "total_steps": 33920, "loss": 0.4292, "lr": 7.570513720966108e-06, "epoch": 7.90683962264151, "percentage": 39.53, "elapsed_time": "0:24:55", "remaining_time": "0:38:07", "throughput": 5843.76, "total_tokens": 8738432} {"current_steps": 13415, "total_steps": 33920, "loss": 0.3657, "lr": 7.56830669028898e-06, "epoch": 7.909787735849057, "percentage": 39.55, "elapsed_time": "0:24:55", "remaining_time": "0:38:06", "throughput": 5843.97, "total_tokens": 8742080} {"current_steps": 13420, "total_steps": 33920, "loss": 0.4759, "lr": 7.566098979641588e-06, "epoch": 7.912735849056604, "percentage": 39.56, "elapsed_time": "0:24:56", "remaining_time": "0:38:05", "throughput": 5844.07, "total_tokens": 8745120} {"current_steps": 13425, "total_steps": 33920, "loss": 0.4181, "lr": 7.563890589608427e-06, "epoch": 7.915683962264151, "percentage": 39.58, "elapsed_time": "0:24:57", "remaining_time": "0:38:05", "throughput": 5844.27, "total_tokens": 8750592} {"current_steps": 13430, "total_steps": 33920, "loss": 0.4343, "lr": 7.561681520774187e-06, "epoch": 7.918632075471698, "percentage": 39.59, "elapsed_time": "0:24:57", "remaining_time": "0:38:05", "throughput": 5844.68, "total_tokens": 8754432} {"current_steps": 13435, "total_steps": 33920, "loss": 0.5774, "lr": 7.559471773723721e-06, "epoch": 7.921580188679245, "percentage": 39.61, "elapsed_time": "0:24:58", "remaining_time": "0:38:04", "throughput": 5844.96, "total_tokens": 8758016} {"current_steps": 13440, "total_steps": 33920, "loss": 0.3994, "lr": 7.557261349042073e-06, "epoch": 7.9245283018867925, "percentage": 39.62, "elapsed_time": "0:24:58", "remaining_time": "0:38:03", "throughput": 5844.87, "total_tokens": 8760544} {"current_steps": 13445, "total_steps": 33920, "loss": 0.4744, "lr": 7.555050247314464e-06, "epoch": 7.92747641509434, "percentage": 39.64, "elapsed_time": "0:24:59", "remaining_time": "0:38:03", "throughput": 5845.4, "total_tokens": 8765792} {"current_steps": 13450, "total_steps": 33920, "loss": 0.3427, "lr": 7.552838469126289e-06, "epoch": 7.930424528301887, "percentage": 39.65, "elapsed_time": "0:25:00", "remaining_time": "0:38:03", "throughput": 5845.41, "total_tokens": 8768608} {"current_steps": 13455, "total_steps": 33920, "loss": 0.3828, "lr": 7.550626015063125e-06, "epoch": 7.933372641509434, "percentage": 39.67, "elapsed_time": "0:25:00", "remaining_time": "0:38:02", "throughput": 5845.49, "total_tokens": 8771680} {"current_steps": 13460, "total_steps": 33920, "loss": 0.3649, "lr": 7.548412885710734e-06, "epoch": 7.936320754716981, "percentage": 39.68, "elapsed_time": "0:25:01", "remaining_time": "0:38:01", "throughput": 5845.62, "total_tokens": 8774720} {"current_steps": 13465, "total_steps": 33920, "loss": 0.3616, "lr": 7.546199081655048e-06, "epoch": 7.939268867924528, "percentage": 39.7, "elapsed_time": "0:25:01", "remaining_time": "0:38:01", "throughput": 5845.74, "total_tokens": 8778080} {"current_steps": 13470, "total_steps": 33920, "loss": 0.5237, "lr": 7.54398460348218e-06, "epoch": 7.942216981132075, "percentage": 39.71, "elapsed_time": "0:25:02", "remaining_time": "0:38:00", "throughput": 5845.74, "total_tokens": 8781568} {"current_steps": 13475, "total_steps": 33920, "loss": 0.4307, "lr": 7.541769451778425e-06, "epoch": 7.945165094339623, "percentage": 39.73, "elapsed_time": "0:25:02", "remaining_time": "0:38:00", "throughput": 5845.79, "total_tokens": 8784768} {"current_steps": 13480, "total_steps": 33920, "loss": 0.3514, "lr": 7.5395536271302536e-06, "epoch": 7.94811320754717, "percentage": 39.74, "elapsed_time": "0:25:03", "remaining_time": "0:37:59", "throughput": 5845.96, "total_tokens": 8788032} {"current_steps": 13485, "total_steps": 33920, "loss": 0.3308, "lr": 7.5373371301243136e-06, "epoch": 7.951061320754717, "percentage": 39.76, "elapsed_time": "0:25:04", "remaining_time": "0:37:59", "throughput": 5846.57, "total_tokens": 8793408} {"current_steps": 13490, "total_steps": 33920, "loss": 0.3728, "lr": 7.535119961347433e-06, "epoch": 7.9540094339622645, "percentage": 39.77, "elapsed_time": "0:25:04", "remaining_time": "0:37:58", "throughput": 5846.66, "total_tokens": 8796704} {"current_steps": 13495, "total_steps": 33920, "loss": 0.3715, "lr": 7.532902121386618e-06, "epoch": 7.956957547169811, "percentage": 39.78, "elapsed_time": "0:25:05", "remaining_time": "0:37:58", "throughput": 5846.95, "total_tokens": 8800448} {"current_steps": 13500, "total_steps": 33920, "loss": 0.5002, "lr": 7.530683610829051e-06, "epoch": 7.959905660377358, "percentage": 39.8, "elapsed_time": "0:25:05", "remaining_time": "0:37:57", "throughput": 5846.85, "total_tokens": 8803296} {"current_steps": 13505, "total_steps": 33920, "loss": 0.4646, "lr": 7.5284644302620906e-06, "epoch": 7.962853773584905, "percentage": 39.81, "elapsed_time": "0:25:06", "remaining_time": "0:37:56", "throughput": 5846.75, "total_tokens": 8805984} {"current_steps": 13510, "total_steps": 33920, "loss": 0.5778, "lr": 7.526244580273274e-06, "epoch": 7.965801886792453, "percentage": 39.83, "elapsed_time": "0:25:06", "remaining_time": "0:37:56", "throughput": 5847.27, "total_tokens": 8811072} {"current_steps": 13515, "total_steps": 33920, "loss": 0.3653, "lr": 7.524024061450318e-06, "epoch": 7.96875, "percentage": 39.84, "elapsed_time": "0:25:07", "remaining_time": "0:37:55", "throughput": 5847.37, "total_tokens": 8814144} {"current_steps": 13520, "total_steps": 33920, "loss": 0.4454, "lr": 7.521802874381115e-06, "epoch": 7.971698113207547, "percentage": 39.86, "elapsed_time": "0:25:07", "remaining_time": "0:37:55", "throughput": 5847.32, "total_tokens": 8816928} {"current_steps": 13525, "total_steps": 33920, "loss": 0.4588, "lr": 7.519581019653731e-06, "epoch": 7.974646226415095, "percentage": 39.87, "elapsed_time": "0:25:08", "remaining_time": "0:37:54", "throughput": 5846.95, "total_tokens": 8819168} {"current_steps": 13530, "total_steps": 33920, "loss": 0.4142, "lr": 7.517358497856413e-06, "epoch": 7.977594339622642, "percentage": 39.89, "elapsed_time": "0:25:08", "remaining_time": "0:37:53", "throughput": 5847.2, "total_tokens": 8822688} {"current_steps": 13535, "total_steps": 33920, "loss": 0.3912, "lr": 7.515135309577584e-06, "epoch": 7.980542452830189, "percentage": 39.9, "elapsed_time": "0:25:09", "remaining_time": "0:37:53", "throughput": 5847.27, "total_tokens": 8825952} {"current_steps": 13540, "total_steps": 33920, "loss": 0.5284, "lr": 7.5129114554058425e-06, "epoch": 7.9834905660377355, "percentage": 39.92, "elapsed_time": "0:25:09", "remaining_time": "0:37:52", "throughput": 5847.25, "total_tokens": 8829184} {"current_steps": 13545, "total_steps": 33920, "loss": 0.4749, "lr": 7.510686935929963e-06, "epoch": 7.986438679245283, "percentage": 39.93, "elapsed_time": "0:25:10", "remaining_time": "0:37:52", "throughput": 5847.45, "total_tokens": 8832768} {"current_steps": 13550, "total_steps": 33920, "loss": 0.3945, "lr": 7.5084617517388965e-06, "epoch": 7.98938679245283, "percentage": 39.95, "elapsed_time": "0:25:11", "remaining_time": "0:37:51", "throughput": 5847.42, "total_tokens": 8835744} {"current_steps": 13555, "total_steps": 33920, "loss": 0.4586, "lr": 7.506235903421771e-06, "epoch": 7.992334905660377, "percentage": 39.96, "elapsed_time": "0:25:11", "remaining_time": "0:37:51", "throughput": 5847.58, "total_tokens": 8839232} {"current_steps": 13560, "total_steps": 33920, "loss": 0.3999, "lr": 7.504009391567889e-06, "epoch": 7.995283018867925, "percentage": 39.98, "elapsed_time": "0:25:12", "remaining_time": "0:37:50", "throughput": 5847.79, "total_tokens": 8842720} {"current_steps": 13565, "total_steps": 33920, "loss": 0.3557, "lr": 7.501782216766729e-06, "epoch": 7.998231132075472, "percentage": 39.99, "elapsed_time": "0:25:12", "remaining_time": "0:37:49", "throughput": 5847.94, "total_tokens": 8845792} {"current_steps": 13568, "total_steps": 33920, "eval_loss": 0.5099420547485352, "epoch": 8.0, "percentage": 40.0, "elapsed_time": "0:25:32", "remaining_time": "0:38:18", "throughput": 5774.61, "total_tokens": 8848168} {"current_steps": 13570, "total_steps": 33920, "loss": 0.429, "lr": 7.499554379607944e-06, "epoch": 8.00117924528302, "percentage": 40.01, "elapsed_time": "0:25:35", "remaining_time": "0:38:23", "throughput": 5761.95, "total_tokens": 8849256} {"current_steps": 13575, "total_steps": 33920, "loss": 0.3561, "lr": 7.497325880681365e-06, "epoch": 8.004127358490566, "percentage": 40.02, "elapsed_time": "0:25:36", "remaining_time": "0:38:22", "throughput": 5762.11, "total_tokens": 8852584} {"current_steps": 13580, "total_steps": 33920, "loss": 0.4698, "lr": 7.495096720576994e-06, "epoch": 8.007075471698114, "percentage": 40.04, "elapsed_time": "0:25:36", "remaining_time": "0:38:21", "throughput": 5762.11, "total_tokens": 8855496} {"current_steps": 13585, "total_steps": 33920, "loss": 0.3735, "lr": 7.492866899885017e-06, "epoch": 8.01002358490566, "percentage": 40.05, "elapsed_time": "0:25:37", "remaining_time": "0:38:21", "throughput": 5762.0, "total_tokens": 8858056} {"current_steps": 13590, "total_steps": 33920, "loss": 0.5267, "lr": 7.490636419195782e-06, "epoch": 8.012971698113208, "percentage": 40.06, "elapsed_time": "0:25:38", "remaining_time": "0:38:20", "throughput": 5762.67, "total_tokens": 8863240} {"current_steps": 13595, "total_steps": 33920, "loss": 0.4313, "lr": 7.488405279099821e-06, "epoch": 8.015919811320755, "percentage": 40.08, "elapsed_time": "0:25:38", "remaining_time": "0:38:20", "throughput": 5762.85, "total_tokens": 8866536} {"current_steps": 13600, "total_steps": 33920, "loss": 0.4359, "lr": 7.48617348018784e-06, "epoch": 8.018867924528301, "percentage": 40.09, "elapsed_time": "0:25:39", "remaining_time": "0:38:19", "throughput": 5762.65, "total_tokens": 8869000} {"current_steps": 13605, "total_steps": 33920, "loss": 0.3305, "lr": 7.4839410230507134e-06, "epoch": 8.02181603773585, "percentage": 40.11, "elapsed_time": "0:25:39", "remaining_time": "0:38:18", "throughput": 5762.4, "total_tokens": 8871656} {"current_steps": 13610, "total_steps": 33920, "loss": 0.3883, "lr": 7.481707908279496e-06, "epoch": 8.024764150943396, "percentage": 40.12, "elapsed_time": "0:25:40", "remaining_time": "0:38:18", "throughput": 5762.52, "total_tokens": 8874792} {"current_steps": 13615, "total_steps": 33920, "loss": 0.2673, "lr": 7.4794741364654144e-06, "epoch": 8.027712264150944, "percentage": 40.14, "elapsed_time": "0:25:40", "remaining_time": "0:38:17", "throughput": 5762.6, "total_tokens": 8877896} {"current_steps": 13620, "total_steps": 33920, "loss": 0.4106, "lr": 7.477239708199871e-06, "epoch": 8.03066037735849, "percentage": 40.15, "elapsed_time": "0:25:41", "remaining_time": "0:38:17", "throughput": 5762.6, "total_tokens": 8881096} {"current_steps": 13625, "total_steps": 33920, "loss": 0.362, "lr": 7.475004624074434e-06, "epoch": 8.033608490566039, "percentage": 40.17, "elapsed_time": "0:25:41", "remaining_time": "0:38:16", "throughput": 5762.39, "total_tokens": 8883496} {"current_steps": 13630, "total_steps": 33920, "loss": 0.5068, "lr": 7.4727688846808595e-06, "epoch": 8.036556603773585, "percentage": 40.18, "elapsed_time": "0:25:42", "remaining_time": "0:38:15", "throughput": 5762.63, "total_tokens": 8886856} {"current_steps": 13635, "total_steps": 33920, "loss": 0.4106, "lr": 7.4705324906110654e-06, "epoch": 8.039504716981131, "percentage": 40.2, "elapsed_time": "0:25:42", "remaining_time": "0:38:15", "throughput": 5762.75, "total_tokens": 8890280} {"current_steps": 13640, "total_steps": 33920, "loss": 0.4369, "lr": 7.4682954424571466e-06, "epoch": 8.04245283018868, "percentage": 40.21, "elapsed_time": "0:25:43", "remaining_time": "0:38:14", "throughput": 5762.91, "total_tokens": 8893384} {"current_steps": 13645, "total_steps": 33920, "loss": 0.5718, "lr": 7.466057740811372e-06, "epoch": 8.045400943396226, "percentage": 40.23, "elapsed_time": "0:25:43", "remaining_time": "0:38:13", "throughput": 5762.85, "total_tokens": 8896136} {"current_steps": 13650, "total_steps": 33920, "loss": 0.4577, "lr": 7.463819386266182e-06, "epoch": 8.048349056603774, "percentage": 40.24, "elapsed_time": "0:25:44", "remaining_time": "0:38:13", "throughput": 5763.07, "total_tokens": 8899944} {"current_steps": 13655, "total_steps": 33920, "loss": 0.3305, "lr": 7.461580379414191e-06, "epoch": 8.05129716981132, "percentage": 40.26, "elapsed_time": "0:25:44", "remaining_time": "0:38:12", "throughput": 5763.23, "total_tokens": 8903400} {"current_steps": 13660, "total_steps": 33920, "loss": 0.3973, "lr": 7.459340720848187e-06, "epoch": 8.054245283018869, "percentage": 40.27, "elapsed_time": "0:25:45", "remaining_time": "0:38:12", "throughput": 5763.44, "total_tokens": 8906856} {"current_steps": 13665, "total_steps": 33920, "loss": 0.3616, "lr": 7.457100411161128e-06, "epoch": 8.057193396226415, "percentage": 40.29, "elapsed_time": "0:25:45", "remaining_time": "0:38:11", "throughput": 5763.35, "total_tokens": 8909832} {"current_steps": 13670, "total_steps": 33920, "loss": 0.5317, "lr": 7.454859450946144e-06, "epoch": 8.060141509433961, "percentage": 40.3, "elapsed_time": "0:25:46", "remaining_time": "0:38:10", "throughput": 5763.38, "total_tokens": 8912904} {"current_steps": 13675, "total_steps": 33920, "loss": 0.4443, "lr": 7.4526178407965396e-06, "epoch": 8.06308962264151, "percentage": 40.32, "elapsed_time": "0:25:47", "remaining_time": "0:38:10", "throughput": 5763.53, "total_tokens": 8916200} {"current_steps": 13680, "total_steps": 33920, "loss": 0.4242, "lr": 7.450375581305794e-06, "epoch": 8.066037735849056, "percentage": 40.33, "elapsed_time": "0:25:47", "remaining_time": "0:38:09", "throughput": 5763.44, "total_tokens": 8919272} {"current_steps": 13685, "total_steps": 33920, "loss": 0.3985, "lr": 7.448132673067552e-06, "epoch": 8.068985849056604, "percentage": 40.34, "elapsed_time": "0:25:48", "remaining_time": "0:38:09", "throughput": 5763.67, "total_tokens": 8923272} {"current_steps": 13690, "total_steps": 33920, "loss": 0.6907, "lr": 7.445889116675634e-06, "epoch": 8.07193396226415, "percentage": 40.36, "elapsed_time": "0:25:48", "remaining_time": "0:38:08", "throughput": 5764.01, "total_tokens": 8927528} {"current_steps": 13695, "total_steps": 33920, "loss": 0.3503, "lr": 7.443644912724031e-06, "epoch": 8.074882075471699, "percentage": 40.37, "elapsed_time": "0:25:49", "remaining_time": "0:38:08", "throughput": 5763.81, "total_tokens": 8929992} {"current_steps": 13700, "total_steps": 33920, "loss": 0.4373, "lr": 7.441400061806907e-06, "epoch": 8.077830188679245, "percentage": 40.39, "elapsed_time": "0:25:49", "remaining_time": "0:38:07", "throughput": 5763.99, "total_tokens": 8933864} {"current_steps": 13705, "total_steps": 33920, "loss": 0.5058, "lr": 7.439154564518592e-06, "epoch": 8.080778301886792, "percentage": 40.4, "elapsed_time": "0:25:50", "remaining_time": "0:38:07", "throughput": 5764.19, "total_tokens": 8937832} {"current_steps": 13710, "total_steps": 33920, "loss": 0.3998, "lr": 7.436908421453597e-06, "epoch": 8.08372641509434, "percentage": 40.42, "elapsed_time": "0:25:51", "remaining_time": "0:38:06", "throughput": 5764.33, "total_tokens": 8941224} {"current_steps": 13715, "total_steps": 33920, "loss": 0.3248, "lr": 7.434661633206593e-06, "epoch": 8.086674528301886, "percentage": 40.43, "elapsed_time": "0:25:51", "remaining_time": "0:38:05", "throughput": 5764.37, "total_tokens": 8944168} {"current_steps": 13720, "total_steps": 33920, "loss": 0.3541, "lr": 7.4324142003724286e-06, "epoch": 8.089622641509434, "percentage": 40.45, "elapsed_time": "0:25:52", "remaining_time": "0:38:05", "throughput": 5764.3, "total_tokens": 8946792} {"current_steps": 13725, "total_steps": 33920, "loss": 0.4109, "lr": 7.430166123546122e-06, "epoch": 8.09257075471698, "percentage": 40.46, "elapsed_time": "0:25:52", "remaining_time": "0:38:04", "throughput": 5764.5, "total_tokens": 8950216} {"current_steps": 13730, "total_steps": 33920, "loss": 0.4462, "lr": 7.427917403322862e-06, "epoch": 8.095518867924529, "percentage": 40.48, "elapsed_time": "0:25:53", "remaining_time": "0:38:04", "throughput": 5764.84, "total_tokens": 8954312} {"current_steps": 13735, "total_steps": 33920, "loss": 0.4719, "lr": 7.425668040298003e-06, "epoch": 8.098466981132075, "percentage": 40.49, "elapsed_time": "0:25:53", "remaining_time": "0:38:03", "throughput": 5765.17, "total_tokens": 8958376} {"current_steps": 13740, "total_steps": 33920, "loss": 0.336, "lr": 7.4234180350670785e-06, "epoch": 8.101415094339623, "percentage": 40.51, "elapsed_time": "0:25:54", "remaining_time": "0:38:02", "throughput": 5765.18, "total_tokens": 8961384} {"current_steps": 13745, "total_steps": 33920, "loss": 0.3946, "lr": 7.421167388225785e-06, "epoch": 8.10436320754717, "percentage": 40.52, "elapsed_time": "0:25:54", "remaining_time": "0:38:02", "throughput": 5765.26, "total_tokens": 8964264} {"current_steps": 13750, "total_steps": 33920, "loss": 0.4015, "lr": 7.41891610036999e-06, "epoch": 8.107311320754716, "percentage": 40.54, "elapsed_time": "0:25:55", "remaining_time": "0:38:01", "throughput": 5765.02, "total_tokens": 8966728} {"current_steps": 13755, "total_steps": 33920, "loss": 0.2923, "lr": 7.416664172095732e-06, "epoch": 8.110259433962264, "percentage": 40.55, "elapsed_time": "0:25:55", "remaining_time": "0:38:00", "throughput": 5764.97, "total_tokens": 8969544} {"current_steps": 13760, "total_steps": 33920, "loss": 0.3625, "lr": 7.414411603999221e-06, "epoch": 8.11320754716981, "percentage": 40.57, "elapsed_time": "0:25:56", "remaining_time": "0:38:00", "throughput": 5765.12, "total_tokens": 8972776} {"current_steps": 13765, "total_steps": 33920, "loss": 0.3316, "lr": 7.4121583966768295e-06, "epoch": 8.116155660377359, "percentage": 40.58, "elapsed_time": "0:25:56", "remaining_time": "0:37:59", "throughput": 5765.15, "total_tokens": 8975624} {"current_steps": 13770, "total_steps": 33920, "loss": 0.4319, "lr": 7.409904550725109e-06, "epoch": 8.119103773584905, "percentage": 40.6, "elapsed_time": "0:25:57", "remaining_time": "0:37:59", "throughput": 5765.64, "total_tokens": 8980392} {"current_steps": 13775, "total_steps": 33920, "loss": 0.433, "lr": 7.407650066740771e-06, "epoch": 8.122051886792454, "percentage": 40.61, "elapsed_time": "0:25:58", "remaining_time": "0:37:58", "throughput": 5765.79, "total_tokens": 8984008} {"current_steps": 13780, "total_steps": 33920, "loss": 0.3382, "lr": 7.405394945320702e-06, "epoch": 8.125, "percentage": 40.62, "elapsed_time": "0:25:58", "remaining_time": "0:37:58", "throughput": 5765.88, "total_tokens": 8987304} {"current_steps": 13785, "total_steps": 33920, "loss": 0.4656, "lr": 7.403139187061955e-06, "epoch": 8.127948113207546, "percentage": 40.64, "elapsed_time": "0:25:59", "remaining_time": "0:37:57", "throughput": 5765.76, "total_tokens": 8990216} {"current_steps": 13790, "total_steps": 33920, "loss": 0.4925, "lr": 7.400882792561752e-06, "epoch": 8.130896226415095, "percentage": 40.65, "elapsed_time": "0:25:59", "remaining_time": "0:37:56", "throughput": 5765.74, "total_tokens": 8993480} {"current_steps": 13795, "total_steps": 33920, "loss": 0.3748, "lr": 7.39862576241748e-06, "epoch": 8.133844339622641, "percentage": 40.67, "elapsed_time": "0:26:00", "remaining_time": "0:37:56", "throughput": 5766.23, "total_tokens": 8999112} {"current_steps": 13800, "total_steps": 33920, "loss": 0.4129, "lr": 7.396368097226703e-06, "epoch": 8.13679245283019, "percentage": 40.68, "elapsed_time": "0:26:01", "remaining_time": "0:37:56", "throughput": 5766.47, "total_tokens": 9002824} {"current_steps": 13805, "total_steps": 33920, "loss": 0.4775, "lr": 7.394109797587144e-06, "epoch": 8.139740566037736, "percentage": 40.7, "elapsed_time": "0:26:01", "remaining_time": "0:37:55", "throughput": 5766.56, "total_tokens": 9005736} {"current_steps": 13810, "total_steps": 33920, "loss": 0.4175, "lr": 7.3918508640966956e-06, "epoch": 8.142688679245284, "percentage": 40.71, "elapsed_time": "0:26:02", "remaining_time": "0:37:55", "throughput": 5766.67, "total_tokens": 9009416} {"current_steps": 13815, "total_steps": 33920, "loss": 0.4633, "lr": 7.389591297353424e-06, "epoch": 8.14563679245283, "percentage": 40.73, "elapsed_time": "0:26:02", "remaining_time": "0:37:54", "throughput": 5766.79, "total_tokens": 9012456} {"current_steps": 13820, "total_steps": 33920, "loss": 0.376, "lr": 7.3873310979555565e-06, "epoch": 8.148584905660377, "percentage": 40.74, "elapsed_time": "0:26:03", "remaining_time": "0:37:53", "throughput": 5766.86, "total_tokens": 9015528} {"current_steps": 13825, "total_steps": 33920, "loss": 0.3802, "lr": 7.385070266501495e-06, "epoch": 8.151533018867925, "percentage": 40.76, "elapsed_time": "0:26:03", "remaining_time": "0:37:53", "throughput": 5767.13, "total_tokens": 9019112} {"current_steps": 13830, "total_steps": 33920, "loss": 0.3897, "lr": 7.382808803589798e-06, "epoch": 8.154481132075471, "percentage": 40.77, "elapsed_time": "0:26:04", "remaining_time": "0:37:52", "throughput": 5767.14, "total_tokens": 9021736} {"current_steps": 13835, "total_steps": 33920, "loss": 0.4062, "lr": 7.380546709819204e-06, "epoch": 8.15742924528302, "percentage": 40.79, "elapsed_time": "0:26:04", "remaining_time": "0:37:51", "throughput": 5767.23, "total_tokens": 9024936} {"current_steps": 13840, "total_steps": 33920, "loss": 0.372, "lr": 7.378283985788608e-06, "epoch": 8.160377358490566, "percentage": 40.8, "elapsed_time": "0:26:05", "remaining_time": "0:37:51", "throughput": 5767.24, "total_tokens": 9027560} {"current_steps": 13845, "total_steps": 33920, "loss": 0.4653, "lr": 7.376020632097076e-06, "epoch": 8.163325471698114, "percentage": 40.82, "elapsed_time": "0:26:05", "remaining_time": "0:37:50", "throughput": 5767.41, "total_tokens": 9030504} {"current_steps": 13850, "total_steps": 33920, "loss": 0.2937, "lr": 7.373756649343841e-06, "epoch": 8.16627358490566, "percentage": 40.83, "elapsed_time": "0:26:06", "remaining_time": "0:37:49", "throughput": 5767.57, "total_tokens": 9033704} {"current_steps": 13855, "total_steps": 33920, "loss": 0.3975, "lr": 7.371492038128305e-06, "epoch": 8.169221698113208, "percentage": 40.85, "elapsed_time": "0:26:06", "remaining_time": "0:37:49", "throughput": 5767.96, "total_tokens": 9037800} {"current_steps": 13860, "total_steps": 33920, "loss": 0.3701, "lr": 7.36922679905003e-06, "epoch": 8.172169811320755, "percentage": 40.86, "elapsed_time": "0:26:07", "remaining_time": "0:37:48", "throughput": 5768.2, "total_tokens": 9041160} {"current_steps": 13865, "total_steps": 33920, "loss": 0.3279, "lr": 7.366960932708749e-06, "epoch": 8.175117924528301, "percentage": 40.88, "elapsed_time": "0:26:07", "remaining_time": "0:37:47", "throughput": 5768.26, "total_tokens": 9044200} {"current_steps": 13870, "total_steps": 33920, "loss": 0.348, "lr": 7.364694439704361e-06, "epoch": 8.17806603773585, "percentage": 40.89, "elapsed_time": "0:26:08", "remaining_time": "0:37:47", "throughput": 5768.22, "total_tokens": 9046856} {"current_steps": 13875, "total_steps": 33920, "loss": 0.2514, "lr": 7.3624273206369264e-06, "epoch": 8.181014150943396, "percentage": 40.91, "elapsed_time": "0:26:08", "remaining_time": "0:37:46", "throughput": 5768.11, "total_tokens": 9049288} {"current_steps": 13880, "total_steps": 33920, "loss": 0.3868, "lr": 7.360159576106681e-06, "epoch": 8.183962264150944, "percentage": 40.92, "elapsed_time": "0:26:09", "remaining_time": "0:37:45", "throughput": 5768.07, "total_tokens": 9051976} {"current_steps": 13885, "total_steps": 33920, "loss": 0.2955, "lr": 7.357891206714014e-06, "epoch": 8.18691037735849, "percentage": 40.93, "elapsed_time": "0:26:09", "remaining_time": "0:37:45", "throughput": 5768.31, "total_tokens": 9055336} {"current_steps": 13890, "total_steps": 33920, "loss": 0.3901, "lr": 7.355622213059487e-06, "epoch": 8.189858490566039, "percentage": 40.95, "elapsed_time": "0:26:10", "remaining_time": "0:37:44", "throughput": 5768.3, "total_tokens": 9058120} {"current_steps": 13895, "total_steps": 33920, "loss": 0.2998, "lr": 7.353352595743829e-06, "epoch": 8.192806603773585, "percentage": 40.96, "elapsed_time": "0:26:10", "remaining_time": "0:37:43", "throughput": 5768.39, "total_tokens": 9061160} {"current_steps": 13900, "total_steps": 33920, "loss": 0.4522, "lr": 7.351082355367928e-06, "epoch": 8.195754716981131, "percentage": 40.98, "elapsed_time": "0:26:11", "remaining_time": "0:37:43", "throughput": 5768.55, "total_tokens": 9064552} {"current_steps": 13905, "total_steps": 33920, "loss": 0.3219, "lr": 7.34881149253284e-06, "epoch": 8.19870283018868, "percentage": 40.99, "elapsed_time": "0:26:11", "remaining_time": "0:37:42", "throughput": 5768.8, "total_tokens": 9068488} {"current_steps": 13910, "total_steps": 33920, "loss": 0.4691, "lr": 7.346540007839787e-06, "epoch": 8.201650943396226, "percentage": 41.01, "elapsed_time": "0:26:12", "remaining_time": "0:37:42", "throughput": 5769.01, "total_tokens": 9071752} {"current_steps": 13915, "total_steps": 33920, "loss": 0.4471, "lr": 7.344267901890154e-06, "epoch": 8.204599056603774, "percentage": 41.02, "elapsed_time": "0:26:12", "remaining_time": "0:37:41", "throughput": 5768.84, "total_tokens": 9074120} {"current_steps": 13920, "total_steps": 33920, "loss": 0.4004, "lr": 7.341995175285491e-06, "epoch": 8.20754716981132, "percentage": 41.04, "elapsed_time": "0:26:13", "remaining_time": "0:37:40", "throughput": 5768.84, "total_tokens": 9076968} {"current_steps": 13925, "total_steps": 33920, "loss": 0.4406, "lr": 7.339721828627512e-06, "epoch": 8.210495283018869, "percentage": 41.05, "elapsed_time": "0:26:13", "remaining_time": "0:37:40", "throughput": 5769.08, "total_tokens": 9080264} {"current_steps": 13930, "total_steps": 33920, "loss": 0.2811, "lr": 7.337447862518096e-06, "epoch": 8.213443396226415, "percentage": 41.07, "elapsed_time": "0:26:14", "remaining_time": "0:37:39", "throughput": 5769.04, "total_tokens": 9082984} {"current_steps": 13935, "total_steps": 33920, "loss": 0.3452, "lr": 7.335173277559282e-06, "epoch": 8.216391509433961, "percentage": 41.08, "elapsed_time": "0:26:14", "remaining_time": "0:37:38", "throughput": 5769.25, "total_tokens": 9086344} {"current_steps": 13940, "total_steps": 33920, "loss": 0.3691, "lr": 7.332898074353281e-06, "epoch": 8.21933962264151, "percentage": 41.1, "elapsed_time": "0:26:15", "remaining_time": "0:37:38", "throughput": 5769.38, "total_tokens": 9089448} {"current_steps": 13945, "total_steps": 33920, "loss": 0.2899, "lr": 7.330622253502461e-06, "epoch": 8.222287735849056, "percentage": 41.11, "elapsed_time": "0:26:15", "remaining_time": "0:37:37", "throughput": 5769.57, "total_tokens": 9092680} {"current_steps": 13950, "total_steps": 33920, "loss": 0.2974, "lr": 7.3283458156093534e-06, "epoch": 8.225235849056604, "percentage": 41.13, "elapsed_time": "0:26:16", "remaining_time": "0:37:36", "throughput": 5769.49, "total_tokens": 9095304} {"current_steps": 13955, "total_steps": 33920, "loss": 0.3705, "lr": 7.326068761276657e-06, "epoch": 8.22818396226415, "percentage": 41.14, "elapsed_time": "0:26:16", "remaining_time": "0:37:36", "throughput": 5769.63, "total_tokens": 9098504} {"current_steps": 13960, "total_steps": 33920, "loss": 0.36, "lr": 7.323791091107231e-06, "epoch": 8.231132075471699, "percentage": 41.16, "elapsed_time": "0:26:17", "remaining_time": "0:37:35", "throughput": 5769.71, "total_tokens": 9101512} {"current_steps": 13965, "total_steps": 33920, "loss": 0.4934, "lr": 7.3215128057040986e-06, "epoch": 8.234080188679245, "percentage": 41.17, "elapsed_time": "0:26:17", "remaining_time": "0:37:34", "throughput": 5769.58, "total_tokens": 9103880} {"current_steps": 13970, "total_steps": 33920, "loss": 0.4085, "lr": 7.319233905670447e-06, "epoch": 8.237028301886792, "percentage": 41.19, "elapsed_time": "0:26:18", "remaining_time": "0:37:34", "throughput": 5769.52, "total_tokens": 9106440} {"current_steps": 13975, "total_steps": 33920, "loss": 0.3234, "lr": 7.316954391609622e-06, "epoch": 8.23997641509434, "percentage": 41.2, "elapsed_time": "0:26:18", "remaining_time": "0:37:33", "throughput": 5769.58, "total_tokens": 9109576} {"current_steps": 13980, "total_steps": 33920, "loss": 0.4577, "lr": 7.314674264125137e-06, "epoch": 8.242924528301886, "percentage": 41.21, "elapsed_time": "0:26:19", "remaining_time": "0:37:32", "throughput": 5769.78, "total_tokens": 9113128} {"current_steps": 13985, "total_steps": 33920, "loss": 0.46, "lr": 7.312393523820665e-06, "epoch": 8.245872641509434, "percentage": 41.23, "elapsed_time": "0:26:20", "remaining_time": "0:37:32", "throughput": 5769.88, "total_tokens": 9116552} {"current_steps": 13990, "total_steps": 33920, "loss": 0.4312, "lr": 7.310112171300041e-06, "epoch": 8.24882075471698, "percentage": 41.24, "elapsed_time": "0:26:20", "remaining_time": "0:37:31", "throughput": 5769.94, "total_tokens": 9119656} {"current_steps": 13995, "total_steps": 33920, "loss": 0.4338, "lr": 7.307830207167263e-06, "epoch": 8.251768867924529, "percentage": 41.26, "elapsed_time": "0:26:21", "remaining_time": "0:37:30", "throughput": 5769.98, "total_tokens": 9122568} {"current_steps": 14000, "total_steps": 33920, "loss": 0.4016, "lr": 7.305547632026493e-06, "epoch": 8.254716981132075, "percentage": 41.27, "elapsed_time": "0:26:21", "remaining_time": "0:37:30", "throughput": 5769.87, "total_tokens": 9125160} {"current_steps": 14005, "total_steps": 33920, "loss": 0.4734, "lr": 7.3032644464820515e-06, "epoch": 8.257665094339623, "percentage": 41.29, "elapsed_time": "0:26:22", "remaining_time": "0:37:29", "throughput": 5770.02, "total_tokens": 9128520} {"current_steps": 14010, "total_steps": 33920, "loss": 0.3919, "lr": 7.30098065113842e-06, "epoch": 8.26061320754717, "percentage": 41.3, "elapsed_time": "0:26:22", "remaining_time": "0:37:29", "throughput": 5770.29, "total_tokens": 9132104} {"current_steps": 14015, "total_steps": 33920, "loss": 0.4209, "lr": 7.298696246600244e-06, "epoch": 8.263561320754716, "percentage": 41.32, "elapsed_time": "0:26:23", "remaining_time": "0:37:28", "throughput": 5770.38, "total_tokens": 9135432} {"current_steps": 14020, "total_steps": 33920, "loss": 0.3581, "lr": 7.2964112334723315e-06, "epoch": 8.266509433962264, "percentage": 41.33, "elapsed_time": "0:26:23", "remaining_time": "0:37:28", "throughput": 5770.88, "total_tokens": 9139944} {"current_steps": 14025, "total_steps": 33920, "loss": 0.389, "lr": 7.294125612359647e-06, "epoch": 8.26945754716981, "percentage": 41.35, "elapsed_time": "0:26:24", "remaining_time": "0:37:27", "throughput": 5771.0, "total_tokens": 9143208} {"current_steps": 14030, "total_steps": 33920, "loss": 0.2363, "lr": 7.291839383867318e-06, "epoch": 8.272405660377359, "percentage": 41.36, "elapsed_time": "0:26:24", "remaining_time": "0:37:26", "throughput": 5771.1, "total_tokens": 9146216} {"current_steps": 14035, "total_steps": 33920, "loss": 0.3073, "lr": 7.289552548600638e-06, "epoch": 8.275353773584905, "percentage": 41.38, "elapsed_time": "0:26:25", "remaining_time": "0:37:26", "throughput": 5771.2, "total_tokens": 9149288} {"current_steps": 14040, "total_steps": 33920, "loss": 0.3135, "lr": 7.287265107165052e-06, "epoch": 8.278301886792454, "percentage": 41.39, "elapsed_time": "0:26:25", "remaining_time": "0:37:25", "throughput": 5771.54, "total_tokens": 9153448} {"current_steps": 14045, "total_steps": 33920, "loss": 0.4462, "lr": 7.284977060166171e-06, "epoch": 8.28125, "percentage": 41.41, "elapsed_time": "0:26:26", "remaining_time": "0:37:25", "throughput": 5771.97, "total_tokens": 9157832} {"current_steps": 14050, "total_steps": 33920, "loss": 0.4026, "lr": 7.282688408209766e-06, "epoch": 8.284198113207546, "percentage": 41.42, "elapsed_time": "0:26:27", "remaining_time": "0:37:24", "throughput": 5772.16, "total_tokens": 9161096} {"current_steps": 14055, "total_steps": 33920, "loss": 0.4475, "lr": 7.2803991519017655e-06, "epoch": 8.287146226415095, "percentage": 41.44, "elapsed_time": "0:26:27", "remaining_time": "0:37:23", "throughput": 5772.19, "total_tokens": 9164104} {"current_steps": 14060, "total_steps": 33920, "loss": 0.4329, "lr": 7.2781092918482634e-06, "epoch": 8.290094339622641, "percentage": 41.45, "elapsed_time": "0:26:28", "remaining_time": "0:37:23", "throughput": 5772.2, "total_tokens": 9166728} {"current_steps": 14065, "total_steps": 33920, "loss": 0.4178, "lr": 7.275818828655508e-06, "epoch": 8.29304245283019, "percentage": 41.47, "elapsed_time": "0:26:28", "remaining_time": "0:37:22", "throughput": 5772.29, "total_tokens": 9170056} {"current_steps": 14070, "total_steps": 33920, "loss": 0.3621, "lr": 7.27352776292991e-06, "epoch": 8.295990566037736, "percentage": 41.48, "elapsed_time": "0:26:29", "remaining_time": "0:37:21", "throughput": 5772.38, "total_tokens": 9173192} {"current_steps": 14075, "total_steps": 33920, "loss": 0.4185, "lr": 7.271236095278036e-06, "epoch": 8.298938679245284, "percentage": 41.49, "elapsed_time": "0:26:29", "remaining_time": "0:37:21", "throughput": 5772.53, "total_tokens": 9176616} {"current_steps": 14080, "total_steps": 33920, "loss": 0.4694, "lr": 7.2689438263066195e-06, "epoch": 8.30188679245283, "percentage": 41.51, "elapsed_time": "0:26:30", "remaining_time": "0:37:20", "throughput": 5772.71, "total_tokens": 9179976} {"current_steps": 14085, "total_steps": 33920, "loss": 0.4752, "lr": 7.266650956622546e-06, "epoch": 8.304834905660377, "percentage": 41.52, "elapsed_time": "0:26:30", "remaining_time": "0:37:20", "throughput": 5772.68, "total_tokens": 9183080} {"current_steps": 14090, "total_steps": 33920, "loss": 0.4647, "lr": 7.2643574868328625e-06, "epoch": 8.307783018867925, "percentage": 41.54, "elapsed_time": "0:26:31", "remaining_time": "0:37:19", "throughput": 5772.54, "total_tokens": 9185416} {"current_steps": 14095, "total_steps": 33920, "loss": 0.3161, "lr": 7.262063417544776e-06, "epoch": 8.310731132075471, "percentage": 41.55, "elapsed_time": "0:26:31", "remaining_time": "0:37:18", "throughput": 5772.65, "total_tokens": 9188392} {"current_steps": 14100, "total_steps": 33920, "loss": 0.4071, "lr": 7.25976874936565e-06, "epoch": 8.31367924528302, "percentage": 41.57, "elapsed_time": "0:26:32", "remaining_time": "0:37:18", "throughput": 5772.94, "total_tokens": 9192360} {"current_steps": 14105, "total_steps": 33920, "loss": 0.4578, "lr": 7.257473482903009e-06, "epoch": 8.316627358490566, "percentage": 41.58, "elapsed_time": "0:26:32", "remaining_time": "0:37:17", "throughput": 5772.74, "total_tokens": 9194728} {"current_steps": 14110, "total_steps": 33920, "loss": 0.4118, "lr": 7.255177618764534e-06, "epoch": 8.319575471698114, "percentage": 41.6, "elapsed_time": "0:26:33", "remaining_time": "0:37:16", "throughput": 5772.93, "total_tokens": 9198216} {"current_steps": 14115, "total_steps": 33920, "loss": 0.4386, "lr": 7.252881157558065e-06, "epoch": 8.32252358490566, "percentage": 41.61, "elapsed_time": "0:26:33", "remaining_time": "0:37:16", "throughput": 5773.17, "total_tokens": 9201768} {"current_steps": 14120, "total_steps": 33920, "loss": 0.3745, "lr": 7.250584099891602e-06, "epoch": 8.325471698113208, "percentage": 41.63, "elapsed_time": "0:26:34", "remaining_time": "0:37:15", "throughput": 5773.25, "total_tokens": 9204712} {"current_steps": 14125, "total_steps": 33920, "loss": 0.3689, "lr": 7.248286446373296e-06, "epoch": 8.328419811320755, "percentage": 41.64, "elapsed_time": "0:26:34", "remaining_time": "0:37:15", "throughput": 5773.11, "total_tokens": 9207112} {"current_steps": 14130, "total_steps": 33920, "loss": 0.3721, "lr": 7.245988197611466e-06, "epoch": 8.331367924528301, "percentage": 41.66, "elapsed_time": "0:26:35", "remaining_time": "0:37:14", "throughput": 5773.36, "total_tokens": 9210568} {"current_steps": 14135, "total_steps": 33920, "loss": 0.3289, "lr": 7.2436893542145805e-06, "epoch": 8.33431603773585, "percentage": 41.67, "elapsed_time": "0:26:35", "remaining_time": "0:37:13", "throughput": 5773.44, "total_tokens": 9214248} {"current_steps": 14140, "total_steps": 33920, "loss": 0.4597, "lr": 7.241389916791269e-06, "epoch": 8.337264150943396, "percentage": 41.69, "elapsed_time": "0:26:36", "remaining_time": "0:37:13", "throughput": 5773.85, "total_tokens": 9218376} {"current_steps": 14145, "total_steps": 33920, "loss": 0.4129, "lr": 7.239089885950317e-06, "epoch": 8.340212264150944, "percentage": 41.7, "elapsed_time": "0:26:37", "remaining_time": "0:37:12", "throughput": 5774.13, "total_tokens": 9222152} {"current_steps": 14150, "total_steps": 33920, "loss": 0.3677, "lr": 7.236789262300667e-06, "epoch": 8.34316037735849, "percentage": 41.72, "elapsed_time": "0:26:37", "remaining_time": "0:37:12", "throughput": 5774.23, "total_tokens": 9225448} {"current_steps": 14155, "total_steps": 33920, "loss": 0.4122, "lr": 7.23448804645142e-06, "epoch": 8.346108490566039, "percentage": 41.73, "elapsed_time": "0:26:38", "remaining_time": "0:37:11", "throughput": 5774.51, "total_tokens": 9228904} {"current_steps": 14160, "total_steps": 33920, "loss": 0.3969, "lr": 7.232186239011834e-06, "epoch": 8.349056603773585, "percentage": 41.75, "elapsed_time": "0:26:38", "remaining_time": "0:37:11", "throughput": 5774.66, "total_tokens": 9232456} {"current_steps": 14165, "total_steps": 33920, "loss": 0.3695, "lr": 7.2298838405913195e-06, "epoch": 8.352004716981131, "percentage": 41.76, "elapsed_time": "0:26:39", "remaining_time": "0:37:10", "throughput": 5774.79, "total_tokens": 9235496} {"current_steps": 14170, "total_steps": 33920, "loss": 0.4045, "lr": 7.227580851799448e-06, "epoch": 8.35495283018868, "percentage": 41.77, "elapsed_time": "0:26:39", "remaining_time": "0:37:09", "throughput": 5774.79, "total_tokens": 9238184} {"current_steps": 14175, "total_steps": 33920, "loss": 0.4096, "lr": 7.2252772732459455e-06, "epoch": 8.357900943396226, "percentage": 41.79, "elapsed_time": "0:26:40", "remaining_time": "0:37:08", "throughput": 5774.74, "total_tokens": 9240680} {"current_steps": 14180, "total_steps": 33920, "loss": 0.3944, "lr": 7.222973105540696e-06, "epoch": 8.360849056603774, "percentage": 41.8, "elapsed_time": "0:26:40", "remaining_time": "0:37:08", "throughput": 5774.94, "total_tokens": 9243944} {"current_steps": 14185, "total_steps": 33920, "loss": 0.3471, "lr": 7.2206683492937345e-06, "epoch": 8.36379716981132, "percentage": 41.82, "elapsed_time": "0:26:41", "remaining_time": "0:37:07", "throughput": 5774.91, "total_tokens": 9246792} {"current_steps": 14190, "total_steps": 33920, "loss": 0.3932, "lr": 7.218363005115259e-06, "epoch": 8.366745283018869, "percentage": 41.83, "elapsed_time": "0:26:41", "remaining_time": "0:37:07", "throughput": 5775.3, "total_tokens": 9251048} {"current_steps": 14195, "total_steps": 33920, "loss": 0.4088, "lr": 7.216057073615617e-06, "epoch": 8.369693396226415, "percentage": 41.85, "elapsed_time": "0:26:42", "remaining_time": "0:37:06", "throughput": 5775.61, "total_tokens": 9254856} {"current_steps": 14200, "total_steps": 33920, "loss": 0.4401, "lr": 7.21375055540531e-06, "epoch": 8.372641509433961, "percentage": 41.86, "elapsed_time": "0:26:42", "remaining_time": "0:37:05", "throughput": 5775.69, "total_tokens": 9257832} {"current_steps": 14205, "total_steps": 33920, "loss": 0.3207, "lr": 7.211443451095007e-06, "epoch": 8.37558962264151, "percentage": 41.88, "elapsed_time": "0:26:43", "remaining_time": "0:37:05", "throughput": 5775.89, "total_tokens": 9261352} {"current_steps": 14210, "total_steps": 33920, "loss": 0.3891, "lr": 7.2091357612955185e-06, "epoch": 8.378537735849056, "percentage": 41.89, "elapsed_time": "0:26:44", "remaining_time": "0:37:04", "throughput": 5776.23, "total_tokens": 9265096} {"current_steps": 14215, "total_steps": 33920, "loss": 0.3951, "lr": 7.206827486617816e-06, "epoch": 8.381485849056604, "percentage": 41.91, "elapsed_time": "0:26:44", "remaining_time": "0:37:04", "throughput": 5776.57, "total_tokens": 9268904} {"current_steps": 14220, "total_steps": 33920, "loss": 0.5359, "lr": 7.204518627673026e-06, "epoch": 8.38443396226415, "percentage": 41.92, "elapsed_time": "0:26:45", "remaining_time": "0:37:03", "throughput": 5776.45, "total_tokens": 9271464} {"current_steps": 14225, "total_steps": 33920, "loss": 0.549, "lr": 7.202209185072428e-06, "epoch": 8.387382075471699, "percentage": 41.94, "elapsed_time": "0:26:45", "remaining_time": "0:37:02", "throughput": 5776.44, "total_tokens": 9274280} {"current_steps": 14230, "total_steps": 33920, "loss": 0.3769, "lr": 7.199899159427457e-06, "epoch": 8.390330188679245, "percentage": 41.95, "elapsed_time": "0:26:46", "remaining_time": "0:37:02", "throughput": 5776.44, "total_tokens": 9277224} {"current_steps": 14235, "total_steps": 33920, "loss": 0.3814, "lr": 7.1975885513497035e-06, "epoch": 8.393278301886792, "percentage": 41.97, "elapsed_time": "0:26:46", "remaining_time": "0:37:01", "throughput": 5776.8, "total_tokens": 9281224} {"current_steps": 14240, "total_steps": 33920, "loss": 0.4956, "lr": 7.195277361450909e-06, "epoch": 8.39622641509434, "percentage": 41.98, "elapsed_time": "0:26:47", "remaining_time": "0:37:01", "throughput": 5776.75, "total_tokens": 9283912} {"current_steps": 14245, "total_steps": 33920, "loss": 0.628, "lr": 7.192965590342973e-06, "epoch": 8.399174528301886, "percentage": 42.0, "elapsed_time": "0:26:47", "remaining_time": "0:37:00", "throughput": 5777.19, "total_tokens": 9288616} {"current_steps": 14250, "total_steps": 33920, "loss": 0.493, "lr": 7.190653238637945e-06, "epoch": 8.402122641509434, "percentage": 42.01, "elapsed_time": "0:26:48", "remaining_time": "0:36:59", "throughput": 5777.23, "total_tokens": 9291400} {"current_steps": 14255, "total_steps": 33920, "loss": 0.4921, "lr": 7.18834030694803e-06, "epoch": 8.40507075471698, "percentage": 42.03, "elapsed_time": "0:26:48", "remaining_time": "0:36:59", "throughput": 5777.36, "total_tokens": 9294632} {"current_steps": 14260, "total_steps": 33920, "loss": 0.4218, "lr": 7.186026795885589e-06, "epoch": 8.408018867924529, "percentage": 42.04, "elapsed_time": "0:26:49", "remaining_time": "0:36:58", "throughput": 5777.74, "total_tokens": 9298664} {"current_steps": 14265, "total_steps": 33920, "loss": 0.3715, "lr": 7.183712706063133e-06, "epoch": 8.410966981132075, "percentage": 42.05, "elapsed_time": "0:26:49", "remaining_time": "0:36:58", "throughput": 5777.84, "total_tokens": 9301544} {"current_steps": 14270, "total_steps": 33920, "loss": 0.4263, "lr": 7.1813980380933255e-06, "epoch": 8.413915094339623, "percentage": 42.07, "elapsed_time": "0:26:50", "remaining_time": "0:36:57", "throughput": 5777.87, "total_tokens": 9304648} {"current_steps": 14275, "total_steps": 33920, "loss": 0.3954, "lr": 7.179082792588986e-06, "epoch": 8.41686320754717, "percentage": 42.08, "elapsed_time": "0:26:50", "remaining_time": "0:36:56", "throughput": 5777.99, "total_tokens": 9307752} {"current_steps": 14280, "total_steps": 33920, "loss": 0.3884, "lr": 7.176766970163087e-06, "epoch": 8.419811320754716, "percentage": 42.1, "elapsed_time": "0:26:51", "remaining_time": "0:36:56", "throughput": 5778.03, "total_tokens": 9310472} {"current_steps": 14285, "total_steps": 33920, "loss": 0.3593, "lr": 7.17445057142875e-06, "epoch": 8.422759433962264, "percentage": 42.11, "elapsed_time": "0:26:51", "remaining_time": "0:36:55", "throughput": 5778.36, "total_tokens": 9314312} {"current_steps": 14290, "total_steps": 33920, "loss": 0.3455, "lr": 7.172133596999253e-06, "epoch": 8.42570754716981, "percentage": 42.13, "elapsed_time": "0:26:52", "remaining_time": "0:36:55", "throughput": 5778.51, "total_tokens": 9317704} {"current_steps": 14295, "total_steps": 33920, "loss": 0.5131, "lr": 7.1698160474880255e-06, "epoch": 8.428655660377359, "percentage": 42.14, "elapsed_time": "0:26:52", "remaining_time": "0:36:54", "throughput": 5778.74, "total_tokens": 9321000} {"current_steps": 14300, "total_steps": 33920, "loss": 0.3584, "lr": 7.167497923508648e-06, "epoch": 8.431603773584905, "percentage": 42.16, "elapsed_time": "0:26:53", "remaining_time": "0:36:53", "throughput": 5778.64, "total_tokens": 9323688} {"current_steps": 14305, "total_steps": 33920, "loss": 0.4258, "lr": 7.165179225674854e-06, "epoch": 8.434551886792454, "percentage": 42.17, "elapsed_time": "0:26:53", "remaining_time": "0:36:53", "throughput": 5778.71, "total_tokens": 9326568} {"current_steps": 14310, "total_steps": 33920, "loss": 0.338, "lr": 7.1628599546005276e-06, "epoch": 8.4375, "percentage": 42.19, "elapsed_time": "0:26:54", "remaining_time": "0:36:52", "throughput": 5778.73, "total_tokens": 9329224} {"current_steps": 14315, "total_steps": 33920, "loss": 0.3929, "lr": 7.160540110899708e-06, "epoch": 8.440448113207546, "percentage": 42.2, "elapsed_time": "0:26:54", "remaining_time": "0:36:51", "throughput": 5778.81, "total_tokens": 9332360} {"current_steps": 14320, "total_steps": 33920, "loss": 0.5698, "lr": 7.158219695186582e-06, "epoch": 8.443396226415095, "percentage": 42.22, "elapsed_time": "0:26:55", "remaining_time": "0:36:51", "throughput": 5778.75, "total_tokens": 9335176} {"current_steps": 14325, "total_steps": 33920, "loss": 0.456, "lr": 7.1558987080754905e-06, "epoch": 8.446344339622641, "percentage": 42.23, "elapsed_time": "0:26:56", "remaining_time": "0:36:50", "throughput": 5779.17, "total_tokens": 9339624} {"current_steps": 14330, "total_steps": 33920, "loss": 0.4361, "lr": 7.1535771501809245e-06, "epoch": 8.44929245283019, "percentage": 42.25, "elapsed_time": "0:26:56", "remaining_time": "0:36:49", "throughput": 5779.22, "total_tokens": 9342696} {"current_steps": 14335, "total_steps": 33920, "loss": 0.3994, "lr": 7.151255022117527e-06, "epoch": 8.452240566037736, "percentage": 42.26, "elapsed_time": "0:26:57", "remaining_time": "0:36:49", "throughput": 5779.05, "total_tokens": 9345000} {"current_steps": 14340, "total_steps": 33920, "loss": 0.2395, "lr": 7.148932324500091e-06, "epoch": 8.455188679245284, "percentage": 42.28, "elapsed_time": "0:26:57", "remaining_time": "0:36:48", "throughput": 5779.17, "total_tokens": 9348072} {"current_steps": 14345, "total_steps": 33920, "loss": 0.3975, "lr": 7.146609057943559e-06, "epoch": 8.45813679245283, "percentage": 42.29, "elapsed_time": "0:26:58", "remaining_time": "0:36:48", "throughput": 5779.41, "total_tokens": 9351592} {"current_steps": 14350, "total_steps": 33920, "loss": 0.4588, "lr": 7.14428522306303e-06, "epoch": 8.461084905660377, "percentage": 42.31, "elapsed_time": "0:26:58", "remaining_time": "0:36:47", "throughput": 5779.41, "total_tokens": 9354312} {"current_steps": 14355, "total_steps": 33920, "loss": 0.302, "lr": 7.141960820473745e-06, "epoch": 8.464033018867925, "percentage": 42.32, "elapsed_time": "0:26:59", "remaining_time": "0:36:46", "throughput": 5779.44, "total_tokens": 9357288} {"current_steps": 14360, "total_steps": 33920, "loss": 0.4624, "lr": 7.139635850791102e-06, "epoch": 8.466981132075471, "percentage": 42.33, "elapsed_time": "0:26:59", "remaining_time": "0:36:45", "throughput": 5779.49, "total_tokens": 9360040} {"current_steps": 14365, "total_steps": 33920, "loss": 0.4772, "lr": 7.137310314630647e-06, "epoch": 8.46992924528302, "percentage": 42.35, "elapsed_time": "0:27:00", "remaining_time": "0:36:45", "throughput": 5779.61, "total_tokens": 9363112} {"current_steps": 14370, "total_steps": 33920, "loss": 0.3807, "lr": 7.134984212608074e-06, "epoch": 8.472877358490566, "percentage": 42.36, "elapsed_time": "0:27:00", "remaining_time": "0:36:45", "throughput": 5780.22, "total_tokens": 9369000} {"current_steps": 14375, "total_steps": 33920, "loss": 0.3546, "lr": 7.13265754533923e-06, "epoch": 8.475825471698114, "percentage": 42.38, "elapsed_time": "0:27:01", "remaining_time": "0:36:44", "throughput": 5780.32, "total_tokens": 9372264} {"current_steps": 14380, "total_steps": 33920, "loss": 0.4717, "lr": 7.130330313440109e-06, "epoch": 8.47877358490566, "percentage": 42.39, "elapsed_time": "0:27:01", "remaining_time": "0:36:43", "throughput": 5780.37, "total_tokens": 9375176} {"current_steps": 14385, "total_steps": 33920, "loss": 0.3451, "lr": 7.128002517526856e-06, "epoch": 8.481721698113208, "percentage": 42.41, "elapsed_time": "0:27:02", "remaining_time": "0:36:43", "throughput": 5780.42, "total_tokens": 9378088} {"current_steps": 14390, "total_steps": 33920, "loss": 0.3807, "lr": 7.1256741582157654e-06, "epoch": 8.484669811320755, "percentage": 42.42, "elapsed_time": "0:27:02", "remaining_time": "0:36:42", "throughput": 5780.61, "total_tokens": 9381448} {"current_steps": 14395, "total_steps": 33920, "loss": 0.3888, "lr": 7.123345236123282e-06, "epoch": 8.487617924528301, "percentage": 42.44, "elapsed_time": "0:27:03", "remaining_time": "0:36:42", "throughput": 5780.93, "total_tokens": 9385576} {"current_steps": 14400, "total_steps": 33920, "loss": 0.3748, "lr": 7.121015751865994e-06, "epoch": 8.49056603773585, "percentage": 42.45, "elapsed_time": "0:27:04", "remaining_time": "0:36:41", "throughput": 5780.91, "total_tokens": 9388296} {"current_steps": 14405, "total_steps": 33920, "loss": 0.4586, "lr": 7.118685706060645e-06, "epoch": 8.493514150943396, "percentage": 42.47, "elapsed_time": "0:27:04", "remaining_time": "0:36:40", "throughput": 5781.31, "total_tokens": 9392552} {"current_steps": 14410, "total_steps": 33920, "loss": 0.3036, "lr": 7.116355099324126e-06, "epoch": 8.496462264150944, "percentage": 42.48, "elapsed_time": "0:27:05", "remaining_time": "0:36:40", "throughput": 5781.55, "total_tokens": 9396296} {"current_steps": 14415, "total_steps": 33920, "loss": 0.4239, "lr": 7.114023932273471e-06, "epoch": 8.49941037735849, "percentage": 42.5, "elapsed_time": "0:27:05", "remaining_time": "0:36:39", "throughput": 5781.31, "total_tokens": 9398408} {"current_steps": 14420, "total_steps": 33920, "loss": 0.3825, "lr": 7.111692205525871e-06, "epoch": 8.502358490566039, "percentage": 42.51, "elapsed_time": "0:27:06", "remaining_time": "0:36:39", "throughput": 5781.32, "total_tokens": 9401352} {"current_steps": 14425, "total_steps": 33920, "loss": 0.4372, "lr": 7.109359919698658e-06, "epoch": 8.505306603773585, "percentage": 42.53, "elapsed_time": "0:27:06", "remaining_time": "0:36:38", "throughput": 5781.44, "total_tokens": 9404360} {"current_steps": 14430, "total_steps": 33920, "loss": 0.3583, "lr": 7.107027075409316e-06, "epoch": 8.508254716981131, "percentage": 42.54, "elapsed_time": "0:27:07", "remaining_time": "0:36:37", "throughput": 5781.38, "total_tokens": 9407080} {"current_steps": 14435, "total_steps": 33920, "loss": 0.5223, "lr": 7.104693673275475e-06, "epoch": 8.51120283018868, "percentage": 42.56, "elapsed_time": "0:27:07", "remaining_time": "0:36:37", "throughput": 5781.56, "total_tokens": 9410216} {"current_steps": 14440, "total_steps": 33920, "loss": 0.53, "lr": 7.1023597139149115e-06, "epoch": 8.514150943396226, "percentage": 42.57, "elapsed_time": "0:27:08", "remaining_time": "0:36:36", "throughput": 5781.66, "total_tokens": 9413352} {"current_steps": 14445, "total_steps": 33920, "loss": 0.2691, "lr": 7.100025197945555e-06, "epoch": 8.517099056603774, "percentage": 42.59, "elapsed_time": "0:27:08", "remaining_time": "0:36:35", "throughput": 5781.97, "total_tokens": 9417128} {"current_steps": 14450, "total_steps": 33920, "loss": 0.3329, "lr": 7.097690125985476e-06, "epoch": 8.52004716981132, "percentage": 42.6, "elapsed_time": "0:27:09", "remaining_time": "0:36:35", "throughput": 5781.89, "total_tokens": 9419656} {"current_steps": 14455, "total_steps": 33920, "loss": 0.4832, "lr": 7.095354498652895e-06, "epoch": 8.522995283018869, "percentage": 42.61, "elapsed_time": "0:27:09", "remaining_time": "0:36:34", "throughput": 5781.89, "total_tokens": 9422568} {"current_steps": 14460, "total_steps": 33920, "loss": 0.3866, "lr": 7.093018316566182e-06, "epoch": 8.525943396226415, "percentage": 42.63, "elapsed_time": "0:27:10", "remaining_time": "0:36:33", "throughput": 5781.74, "total_tokens": 9425032} {"current_steps": 14465, "total_steps": 33920, "loss": 0.5568, "lr": 7.0906815803438465e-06, "epoch": 8.528891509433961, "percentage": 42.64, "elapsed_time": "0:27:10", "remaining_time": "0:36:33", "throughput": 5781.96, "total_tokens": 9428904} {"current_steps": 14470, "total_steps": 33920, "loss": 0.4224, "lr": 7.088344290604554e-06, "epoch": 8.53183962264151, "percentage": 42.66, "elapsed_time": "0:27:11", "remaining_time": "0:36:32", "throughput": 5782.02, "total_tokens": 9431912} {"current_steps": 14475, "total_steps": 33920, "loss": 0.3612, "lr": 7.086006447967111e-06, "epoch": 8.534787735849056, "percentage": 42.67, "elapsed_time": "0:27:11", "remaining_time": "0:36:32", "throughput": 5782.32, "total_tokens": 9435464} {"current_steps": 14480, "total_steps": 33920, "loss": 0.5258, "lr": 7.08366805305047e-06, "epoch": 8.537735849056604, "percentage": 42.69, "elapsed_time": "0:27:12", "remaining_time": "0:36:31", "throughput": 5782.09, "total_tokens": 9437832} {"current_steps": 14485, "total_steps": 33920, "loss": 0.4489, "lr": 7.08132910647373e-06, "epoch": 8.54068396226415, "percentage": 42.7, "elapsed_time": "0:27:12", "remaining_time": "0:36:30", "throughput": 5782.0, "total_tokens": 9440328} {"current_steps": 14490, "total_steps": 33920, "loss": 0.3863, "lr": 7.078989608856142e-06, "epoch": 8.543632075471699, "percentage": 42.72, "elapsed_time": "0:27:13", "remaining_time": "0:36:30", "throughput": 5782.07, "total_tokens": 9443304} {"current_steps": 14495, "total_steps": 33920, "loss": 0.4744, "lr": 7.076649560817092e-06, "epoch": 8.546580188679245, "percentage": 42.73, "elapsed_time": "0:27:14", "remaining_time": "0:36:29", "throughput": 5782.61, "total_tokens": 9449608} {"current_steps": 14500, "total_steps": 33920, "loss": 0.342, "lr": 7.0743089629761245e-06, "epoch": 8.549528301886792, "percentage": 42.75, "elapsed_time": "0:27:14", "remaining_time": "0:36:29", "throughput": 5782.7, "total_tokens": 9452520} {"current_steps": 14505, "total_steps": 33920, "loss": 0.288, "lr": 7.071967815952917e-06, "epoch": 8.55247641509434, "percentage": 42.76, "elapsed_time": "0:27:15", "remaining_time": "0:36:28", "throughput": 5782.45, "total_tokens": 9454728} {"current_steps": 14510, "total_steps": 33920, "loss": 0.3987, "lr": 7.0696261203673e-06, "epoch": 8.555424528301886, "percentage": 42.78, "elapsed_time": "0:27:15", "remaining_time": "0:36:27", "throughput": 5782.57, "total_tokens": 9457832} {"current_steps": 14515, "total_steps": 33920, "loss": 0.3172, "lr": 7.067283876839249e-06, "epoch": 8.558372641509434, "percentage": 42.79, "elapsed_time": "0:27:16", "remaining_time": "0:36:27", "throughput": 5782.46, "total_tokens": 9460424} {"current_steps": 14520, "total_steps": 33920, "loss": 0.4047, "lr": 7.064941085988884e-06, "epoch": 8.56132075471698, "percentage": 42.81, "elapsed_time": "0:27:16", "remaining_time": "0:36:26", "throughput": 5782.7, "total_tokens": 9463848} {"current_steps": 14525, "total_steps": 33920, "loss": 0.3855, "lr": 7.062597748436464e-06, "epoch": 8.564268867924529, "percentage": 42.82, "elapsed_time": "0:27:17", "remaining_time": "0:36:25", "throughput": 5783.01, "total_tokens": 9467368} {"current_steps": 14530, "total_steps": 33920, "loss": 0.4486, "lr": 7.060253864802402e-06, "epoch": 8.567216981132075, "percentage": 42.84, "elapsed_time": "0:27:17", "remaining_time": "0:36:25", "throughput": 5783.03, "total_tokens": 9470280} {"current_steps": 14535, "total_steps": 33920, "loss": 0.2998, "lr": 7.05790943570725e-06, "epoch": 8.570165094339622, "percentage": 42.85, "elapsed_time": "0:27:18", "remaining_time": "0:36:24", "throughput": 5783.0, "total_tokens": 9473128} {"current_steps": 14540, "total_steps": 33920, "loss": 0.3409, "lr": 7.055564461771704e-06, "epoch": 8.57311320754717, "percentage": 42.87, "elapsed_time": "0:27:18", "remaining_time": "0:36:24", "throughput": 5783.31, "total_tokens": 9477224} {"current_steps": 14545, "total_steps": 33920, "loss": 0.3431, "lr": 7.053218943616611e-06, "epoch": 8.576061320754716, "percentage": 42.88, "elapsed_time": "0:27:19", "remaining_time": "0:36:23", "throughput": 5783.49, "total_tokens": 9480488} {"current_steps": 14550, "total_steps": 33920, "loss": 0.3548, "lr": 7.050872881862952e-06, "epoch": 8.579009433962264, "percentage": 42.9, "elapsed_time": "0:27:19", "remaining_time": "0:36:22", "throughput": 5783.61, "total_tokens": 9483752} {"current_steps": 14555, "total_steps": 33920, "loss": 0.3602, "lr": 7.04852627713186e-06, "epoch": 8.58195754716981, "percentage": 42.91, "elapsed_time": "0:27:20", "remaining_time": "0:36:22", "throughput": 5783.85, "total_tokens": 9487144} {"current_steps": 14560, "total_steps": 33920, "loss": 0.3691, "lr": 7.0461791300446055e-06, "epoch": 8.584905660377359, "percentage": 42.92, "elapsed_time": "0:27:20", "remaining_time": "0:36:21", "throughput": 5783.91, "total_tokens": 9489960} {"current_steps": 14565, "total_steps": 33920, "loss": 0.5597, "lr": 7.043831441222611e-06, "epoch": 8.587853773584905, "percentage": 42.94, "elapsed_time": "0:27:21", "remaining_time": "0:36:21", "throughput": 5784.36, "total_tokens": 9494568} {"current_steps": 14570, "total_steps": 33920, "loss": 0.447, "lr": 7.04148321128743e-06, "epoch": 8.590801886792454, "percentage": 42.95, "elapsed_time": "0:27:21", "remaining_time": "0:36:20", "throughput": 5784.55, "total_tokens": 9498216} {"current_steps": 14575, "total_steps": 33920, "loss": 0.4238, "lr": 7.039134440860773e-06, "epoch": 8.59375, "percentage": 42.97, "elapsed_time": "0:27:22", "remaining_time": "0:36:20", "throughput": 5784.86, "total_tokens": 9502408} {"current_steps": 14580, "total_steps": 33920, "loss": 0.3865, "lr": 7.036785130564484e-06, "epoch": 8.596698113207546, "percentage": 42.98, "elapsed_time": "0:27:23", "remaining_time": "0:36:19", "throughput": 5784.87, "total_tokens": 9505320} {"current_steps": 14585, "total_steps": 33920, "loss": 0.432, "lr": 7.0344352810205544e-06, "epoch": 8.599646226415095, "percentage": 43.0, "elapsed_time": "0:27:23", "remaining_time": "0:36:18", "throughput": 5784.91, "total_tokens": 9508232} {"current_steps": 14590, "total_steps": 33920, "loss": 0.3003, "lr": 7.032084892851115e-06, "epoch": 8.602594339622641, "percentage": 43.01, "elapsed_time": "0:27:24", "remaining_time": "0:36:18", "throughput": 5785.06, "total_tokens": 9511336} {"current_steps": 14595, "total_steps": 33920, "loss": 0.4037, "lr": 7.0297339666784425e-06, "epoch": 8.60554245283019, "percentage": 43.03, "elapsed_time": "0:27:24", "remaining_time": "0:36:17", "throughput": 5785.2, "total_tokens": 9514600} {"current_steps": 14600, "total_steps": 33920, "loss": 0.3441, "lr": 7.0273825031249556e-06, "epoch": 8.608490566037736, "percentage": 43.04, "elapsed_time": "0:27:25", "remaining_time": "0:36:16", "throughput": 5785.28, "total_tokens": 9517608} {"current_steps": 14605, "total_steps": 33920, "loss": 0.296, "lr": 7.025030502813213e-06, "epoch": 8.611438679245284, "percentage": 43.06, "elapsed_time": "0:27:25", "remaining_time": "0:36:16", "throughput": 5785.5, "total_tokens": 9521000} {"current_steps": 14610, "total_steps": 33920, "loss": 0.4603, "lr": 7.022677966365917e-06, "epoch": 8.61438679245283, "percentage": 43.07, "elapsed_time": "0:27:26", "remaining_time": "0:36:15", "throughput": 5785.49, "total_tokens": 9523720} {"current_steps": 14615, "total_steps": 33920, "loss": 0.3647, "lr": 7.020324894405913e-06, "epoch": 8.617334905660378, "percentage": 43.09, "elapsed_time": "0:27:26", "remaining_time": "0:36:15", "throughput": 5785.68, "total_tokens": 9527080} {"current_steps": 14620, "total_steps": 33920, "loss": 0.4807, "lr": 7.017971287556185e-06, "epoch": 8.620283018867925, "percentage": 43.1, "elapsed_time": "0:27:27", "remaining_time": "0:36:14", "throughput": 5786.1, "total_tokens": 9531368} {"current_steps": 14625, "total_steps": 33920, "loss": 0.3272, "lr": 7.015617146439863e-06, "epoch": 8.623231132075471, "percentage": 43.12, "elapsed_time": "0:27:27", "remaining_time": "0:36:13", "throughput": 5786.2, "total_tokens": 9534376} {"current_steps": 14630, "total_steps": 33920, "loss": 0.4818, "lr": 7.0132624716802125e-06, "epoch": 8.62617924528302, "percentage": 43.13, "elapsed_time": "0:27:28", "remaining_time": "0:36:13", "throughput": 5786.49, "total_tokens": 9538504} {"current_steps": 14635, "total_steps": 33920, "loss": 0.3811, "lr": 7.0109072639006474e-06, "epoch": 8.629127358490566, "percentage": 43.15, "elapsed_time": "0:27:28", "remaining_time": "0:36:12", "throughput": 5786.58, "total_tokens": 9541864} {"current_steps": 14640, "total_steps": 33920, "loss": 0.4787, "lr": 7.008551523724717e-06, "epoch": 8.632075471698114, "percentage": 43.16, "elapsed_time": "0:27:29", "remaining_time": "0:36:12", "throughput": 5786.6, "total_tokens": 9544712} {"current_steps": 14645, "total_steps": 33920, "loss": 0.4003, "lr": 7.006195251776116e-06, "epoch": 8.63502358490566, "percentage": 43.18, "elapsed_time": "0:27:29", "remaining_time": "0:36:11", "throughput": 5786.38, "total_tokens": 9547016} {"current_steps": 14650, "total_steps": 33920, "loss": 0.3155, "lr": 7.003838448678674e-06, "epoch": 8.637971698113208, "percentage": 43.19, "elapsed_time": "0:27:30", "remaining_time": "0:36:10", "throughput": 5786.31, "total_tokens": 9549736} {"current_steps": 14655, "total_steps": 33920, "loss": 0.4608, "lr": 7.0014811150563675e-06, "epoch": 8.640919811320755, "percentage": 43.2, "elapsed_time": "0:27:30", "remaining_time": "0:36:10", "throughput": 5786.46, "total_tokens": 9552936} {"current_steps": 14660, "total_steps": 33920, "loss": 0.4517, "lr": 6.999123251533311e-06, "epoch": 8.643867924528301, "percentage": 43.22, "elapsed_time": "0:27:31", "remaining_time": "0:36:09", "throughput": 5786.78, "total_tokens": 9557064} {"current_steps": 14665, "total_steps": 33920, "loss": 0.4811, "lr": 6.996764858733756e-06, "epoch": 8.64681603773585, "percentage": 43.23, "elapsed_time": "0:27:32", "remaining_time": "0:36:09", "throughput": 5787.16, "total_tokens": 9560968} {"current_steps": 14670, "total_steps": 33920, "loss": 0.4053, "lr": 6.994405937282099e-06, "epoch": 8.649764150943396, "percentage": 43.25, "elapsed_time": "0:27:32", "remaining_time": "0:36:08", "throughput": 5787.41, "total_tokens": 9564680} {"current_steps": 14675, "total_steps": 33920, "loss": 0.4502, "lr": 6.9920464878028745e-06, "epoch": 8.652712264150944, "percentage": 43.26, "elapsed_time": "0:27:33", "remaining_time": "0:36:08", "throughput": 5787.48, "total_tokens": 9567944} {"current_steps": 14680, "total_steps": 33920, "loss": 0.4961, "lr": 6.989686510920758e-06, "epoch": 8.65566037735849, "percentage": 43.28, "elapsed_time": "0:27:33", "remaining_time": "0:36:07", "throughput": 5787.66, "total_tokens": 9571272} {"current_steps": 14685, "total_steps": 33920, "loss": 0.3187, "lr": 6.9873260072605634e-06, "epoch": 8.658608490566039, "percentage": 43.29, "elapsed_time": "0:27:34", "remaining_time": "0:36:07", "throughput": 5788.08, "total_tokens": 9576104} {"current_steps": 14690, "total_steps": 33920, "loss": 0.4937, "lr": 6.984964977447243e-06, "epoch": 8.661556603773585, "percentage": 43.31, "elapsed_time": "0:27:34", "remaining_time": "0:36:06", "throughput": 5788.05, "total_tokens": 9578920} {"current_steps": 14695, "total_steps": 33920, "loss": 0.3695, "lr": 6.982603422105889e-06, "epoch": 8.664504716981131, "percentage": 43.32, "elapsed_time": "0:27:35", "remaining_time": "0:36:06", "throughput": 5788.44, "total_tokens": 9584136} {"current_steps": 14700, "total_steps": 33920, "loss": 0.4547, "lr": 6.980241341861736e-06, "epoch": 8.66745283018868, "percentage": 43.34, "elapsed_time": "0:27:36", "remaining_time": "0:36:06", "throughput": 5788.68, "total_tokens": 9589768} {"current_steps": 14705, "total_steps": 33920, "loss": 0.4855, "lr": 6.977878737340153e-06, "epoch": 8.670400943396226, "percentage": 43.35, "elapsed_time": "0:27:37", "remaining_time": "0:36:06", "throughput": 5789.17, "total_tokens": 9596744} {"current_steps": 14710, "total_steps": 33920, "loss": 0.3848, "lr": 6.97551560916665e-06, "epoch": 8.673349056603774, "percentage": 43.37, "elapsed_time": "0:27:38", "remaining_time": "0:36:05", "throughput": 5789.43, "total_tokens": 9600520} {"current_steps": 14715, "total_steps": 33920, "loss": 0.5385, "lr": 6.973151957966875e-06, "epoch": 8.67629716981132, "percentage": 43.38, "elapsed_time": "0:27:38", "remaining_time": "0:36:04", "throughput": 5789.49, "total_tokens": 9603432} {"current_steps": 14720, "total_steps": 33920, "loss": 0.4285, "lr": 6.970787784366616e-06, "epoch": 8.679245283018869, "percentage": 43.4, "elapsed_time": "0:27:39", "remaining_time": "0:36:04", "throughput": 5789.65, "total_tokens": 9607208} {"current_steps": 14725, "total_steps": 33920, "loss": 0.3787, "lr": 6.968423088991797e-06, "epoch": 8.682193396226415, "percentage": 43.41, "elapsed_time": "0:27:39", "remaining_time": "0:36:03", "throughput": 5789.67, "total_tokens": 9610088} {"current_steps": 14730, "total_steps": 33920, "loss": 0.399, "lr": 6.966057872468481e-06, "epoch": 8.685141509433961, "percentage": 43.43, "elapsed_time": "0:27:40", "remaining_time": "0:36:03", "throughput": 5789.87, "total_tokens": 9613288} {"current_steps": 14735, "total_steps": 33920, "loss": 0.4141, "lr": 6.963692135422872e-06, "epoch": 8.68808962264151, "percentage": 43.44, "elapsed_time": "0:27:41", "remaining_time": "0:36:02", "throughput": 5790.21, "total_tokens": 9617928} {"current_steps": 14740, "total_steps": 33920, "loss": 0.3259, "lr": 6.961325878481305e-06, "epoch": 8.691037735849056, "percentage": 43.46, "elapsed_time": "0:27:41", "remaining_time": "0:36:02", "throughput": 5790.28, "total_tokens": 9620712} {"current_steps": 14745, "total_steps": 33920, "loss": 0.5477, "lr": 6.958959102270259e-06, "epoch": 8.693985849056604, "percentage": 43.47, "elapsed_time": "0:27:42", "remaining_time": "0:36:01", "throughput": 5790.45, "total_tokens": 9623784} {"current_steps": 14750, "total_steps": 33920, "loss": 0.3008, "lr": 6.95659180741635e-06, "epoch": 8.69693396226415, "percentage": 43.48, "elapsed_time": "0:27:42", "remaining_time": "0:36:00", "throughput": 5790.54, "total_tokens": 9626856} {"current_steps": 14755, "total_steps": 33920, "loss": 0.4244, "lr": 6.954223994546326e-06, "epoch": 8.699882075471699, "percentage": 43.5, "elapsed_time": "0:27:43", "remaining_time": "0:36:00", "throughput": 5790.59, "total_tokens": 9629800} {"current_steps": 14760, "total_steps": 33920, "loss": 0.3438, "lr": 6.951855664287077e-06, "epoch": 8.702830188679245, "percentage": 43.51, "elapsed_time": "0:27:43", "remaining_time": "0:35:59", "throughput": 5790.81, "total_tokens": 9633384} {"current_steps": 14765, "total_steps": 33920, "loss": 0.3257, "lr": 6.9494868172656304e-06, "epoch": 8.705778301886792, "percentage": 43.53, "elapsed_time": "0:27:44", "remaining_time": "0:35:58", "throughput": 5790.95, "total_tokens": 9636872} {"current_steps": 14770, "total_steps": 33920, "loss": 0.3777, "lr": 6.947117454109146e-06, "epoch": 8.70872641509434, "percentage": 43.54, "elapsed_time": "0:27:44", "remaining_time": "0:35:58", "throughput": 5791.0, "total_tokens": 9639720} {"current_steps": 14775, "total_steps": 33920, "loss": 0.567, "lr": 6.944747575444924e-06, "epoch": 8.711674528301886, "percentage": 43.56, "elapsed_time": "0:27:45", "remaining_time": "0:35:57", "throughput": 5791.07, "total_tokens": 9642600} {"current_steps": 14780, "total_steps": 33920, "loss": 0.3753, "lr": 6.942377181900399e-06, "epoch": 8.714622641509434, "percentage": 43.57, "elapsed_time": "0:27:45", "remaining_time": "0:35:57", "throughput": 5791.39, "total_tokens": 9646568} {"current_steps": 14785, "total_steps": 33920, "loss": 0.3925, "lr": 6.940006274103146e-06, "epoch": 8.71757075471698, "percentage": 43.59, "elapsed_time": "0:27:46", "remaining_time": "0:35:56", "throughput": 5791.39, "total_tokens": 9649448} {"current_steps": 14790, "total_steps": 33920, "loss": 0.4324, "lr": 6.93763485268087e-06, "epoch": 8.720518867924529, "percentage": 43.6, "elapsed_time": "0:27:46", "remaining_time": "0:35:55", "throughput": 5791.26, "total_tokens": 9652008} {"current_steps": 14795, "total_steps": 33920, "loss": 0.3284, "lr": 6.935262918261416e-06, "epoch": 8.723466981132075, "percentage": 43.62, "elapsed_time": "0:27:47", "remaining_time": "0:35:55", "throughput": 5791.37, "total_tokens": 9655048} {"current_steps": 14800, "total_steps": 33920, "loss": 0.5942, "lr": 6.932890471472764e-06, "epoch": 8.726415094339622, "percentage": 43.63, "elapsed_time": "0:27:47", "remaining_time": "0:35:54", "throughput": 5791.44, "total_tokens": 9657960} {"current_steps": 14805, "total_steps": 33920, "loss": 0.4625, "lr": 6.930517512943029e-06, "epoch": 8.72936320754717, "percentage": 43.65, "elapsed_time": "0:27:48", "remaining_time": "0:35:53", "throughput": 5791.65, "total_tokens": 9661224} {"current_steps": 14810, "total_steps": 33920, "loss": 0.2971, "lr": 6.928144043300463e-06, "epoch": 8.732311320754716, "percentage": 43.66, "elapsed_time": "0:27:48", "remaining_time": "0:35:53", "throughput": 5791.78, "total_tokens": 9664392} {"current_steps": 14815, "total_steps": 33920, "loss": 0.5073, "lr": 6.925770063173451e-06, "epoch": 8.735259433962264, "percentage": 43.68, "elapsed_time": "0:27:49", "remaining_time": "0:35:52", "throughput": 5792.22, "total_tokens": 9668904} {"current_steps": 14820, "total_steps": 33920, "loss": 0.3598, "lr": 6.923395573190514e-06, "epoch": 8.73820754716981, "percentage": 43.69, "elapsed_time": "0:27:49", "remaining_time": "0:35:52", "throughput": 5792.43, "total_tokens": 9672424} {"current_steps": 14825, "total_steps": 33920, "loss": 0.3798, "lr": 6.921020573980313e-06, "epoch": 8.741155660377359, "percentage": 43.71, "elapsed_time": "0:27:50", "remaining_time": "0:35:51", "throughput": 5792.54, "total_tokens": 9675624} {"current_steps": 14830, "total_steps": 33920, "loss": 0.3263, "lr": 6.918645066171634e-06, "epoch": 8.744103773584905, "percentage": 43.72, "elapsed_time": "0:27:50", "remaining_time": "0:35:50", "throughput": 5792.74, "total_tokens": 9678920} {"current_steps": 14835, "total_steps": 33920, "loss": 0.3873, "lr": 6.916269050393404e-06, "epoch": 8.747051886792454, "percentage": 43.74, "elapsed_time": "0:27:51", "remaining_time": "0:35:50", "throughput": 5792.66, "total_tokens": 9681448} {"current_steps": 14840, "total_steps": 33920, "loss": 0.5164, "lr": 6.913892527274686e-06, "epoch": 8.75, "percentage": 43.75, "elapsed_time": "0:27:51", "remaining_time": "0:35:49", "throughput": 5792.73, "total_tokens": 9684392} {"current_steps": 14845, "total_steps": 33920, "loss": 0.4245, "lr": 6.9115154974446716e-06, "epoch": 8.752948113207546, "percentage": 43.76, "elapsed_time": "0:27:52", "remaining_time": "0:35:48", "throughput": 5792.82, "total_tokens": 9687720} {"current_steps": 14850, "total_steps": 33920, "loss": 0.2978, "lr": 6.909137961532692e-06, "epoch": 8.755896226415095, "percentage": 43.78, "elapsed_time": "0:27:52", "remaining_time": "0:35:48", "throughput": 5792.81, "total_tokens": 9690632} {"current_steps": 14855, "total_steps": 33920, "loss": 0.4541, "lr": 6.906759920168209e-06, "epoch": 8.758844339622641, "percentage": 43.79, "elapsed_time": "0:27:53", "remaining_time": "0:35:47", "throughput": 5792.89, "total_tokens": 9693544} {"current_steps": 14860, "total_steps": 33920, "loss": 0.382, "lr": 6.90438137398082e-06, "epoch": 8.76179245283019, "percentage": 43.81, "elapsed_time": "0:27:54", "remaining_time": "0:35:47", "throughput": 5793.27, "total_tokens": 9697992} {"current_steps": 14865, "total_steps": 33920, "loss": 0.3407, "lr": 6.902002323600252e-06, "epoch": 8.764740566037736, "percentage": 43.82, "elapsed_time": "0:27:54", "remaining_time": "0:35:46", "throughput": 5793.23, "total_tokens": 9700744} {"current_steps": 14870, "total_steps": 33920, "loss": 0.3362, "lr": 6.899622769656373e-06, "epoch": 8.767688679245284, "percentage": 43.84, "elapsed_time": "0:27:55", "remaining_time": "0:35:45", "throughput": 5793.27, "total_tokens": 9703752} {"current_steps": 14875, "total_steps": 33920, "loss": 0.3287, "lr": 6.897242712779179e-06, "epoch": 8.77063679245283, "percentage": 43.85, "elapsed_time": "0:27:55", "remaining_time": "0:35:45", "throughput": 5793.52, "total_tokens": 9707272} {"current_steps": 14880, "total_steps": 33920, "loss": 0.3483, "lr": 6.894862153598802e-06, "epoch": 8.773584905660378, "percentage": 43.87, "elapsed_time": "0:27:56", "remaining_time": "0:35:44", "throughput": 5793.64, "total_tokens": 9710280} {"current_steps": 14885, "total_steps": 33920, "loss": 0.4507, "lr": 6.892481092745502e-06, "epoch": 8.776533018867925, "percentage": 43.88, "elapsed_time": "0:27:56", "remaining_time": "0:35:44", "throughput": 5793.91, "total_tokens": 9714216} {"current_steps": 14890, "total_steps": 33920, "loss": 0.6275, "lr": 6.890099530849677e-06, "epoch": 8.779481132075471, "percentage": 43.9, "elapsed_time": "0:27:57", "remaining_time": "0:35:43", "throughput": 5794.02, "total_tokens": 9717224} {"current_steps": 14895, "total_steps": 33920, "loss": 0.4574, "lr": 6.887717468541855e-06, "epoch": 8.78242924528302, "percentage": 43.91, "elapsed_time": "0:27:57", "remaining_time": "0:35:42", "throughput": 5794.21, "total_tokens": 9720872} {"current_steps": 14900, "total_steps": 33920, "loss": 0.4132, "lr": 6.885334906452696e-06, "epoch": 8.785377358490566, "percentage": 43.93, "elapsed_time": "0:27:58", "remaining_time": "0:35:42", "throughput": 5794.19, "total_tokens": 9723624} {"current_steps": 14905, "total_steps": 33920, "loss": 0.3908, "lr": 6.882951845212997e-06, "epoch": 8.788325471698114, "percentage": 43.94, "elapsed_time": "0:27:58", "remaining_time": "0:35:41", "throughput": 5794.1, "total_tokens": 9726248} {"current_steps": 14910, "total_steps": 33920, "loss": 0.4575, "lr": 6.880568285453682e-06, "epoch": 8.79127358490566, "percentage": 43.96, "elapsed_time": "0:27:59", "remaining_time": "0:35:40", "throughput": 5793.9, "total_tokens": 9728456} {"current_steps": 14915, "total_steps": 33920, "loss": 0.3126, "lr": 6.878184227805807e-06, "epoch": 8.794221698113208, "percentage": 43.97, "elapsed_time": "0:27:59", "remaining_time": "0:35:40", "throughput": 5794.22, "total_tokens": 9732360} {"current_steps": 14920, "total_steps": 33920, "loss": 0.3775, "lr": 6.8757996729005645e-06, "epoch": 8.797169811320755, "percentage": 43.99, "elapsed_time": "0:28:00", "remaining_time": "0:35:39", "throughput": 5794.39, "total_tokens": 9736072} {"current_steps": 14925, "total_steps": 33920, "loss": 0.356, "lr": 6.8734146213692756e-06, "epoch": 8.800117924528301, "percentage": 44.0, "elapsed_time": "0:28:00", "remaining_time": "0:35:39", "throughput": 5794.39, "total_tokens": 9738856} {"current_steps": 14930, "total_steps": 33920, "loss": 0.3749, "lr": 6.87102907384339e-06, "epoch": 8.80306603773585, "percentage": 44.02, "elapsed_time": "0:28:01", "remaining_time": "0:35:38", "throughput": 5794.49, "total_tokens": 9741992} {"current_steps": 14935, "total_steps": 33920, "loss": 0.4098, "lr": 6.868643030954494e-06, "epoch": 8.806014150943396, "percentage": 44.03, "elapsed_time": "0:28:01", "remaining_time": "0:35:37", "throughput": 5794.72, "total_tokens": 9745896} {"current_steps": 14940, "total_steps": 33920, "loss": 0.4265, "lr": 6.866256493334302e-06, "epoch": 8.808962264150944, "percentage": 44.04, "elapsed_time": "0:28:02", "remaining_time": "0:35:37", "throughput": 5795.01, "total_tokens": 9749576} {"current_steps": 14945, "total_steps": 33920, "loss": 0.3347, "lr": 6.863869461614659e-06, "epoch": 8.81191037735849, "percentage": 44.06, "elapsed_time": "0:28:03", "remaining_time": "0:35:36", "throughput": 5795.26, "total_tokens": 9753672} {"current_steps": 14950, "total_steps": 33920, "loss": 0.3544, "lr": 6.861481936427545e-06, "epoch": 8.814858490566039, "percentage": 44.07, "elapsed_time": "0:28:03", "remaining_time": "0:35:36", "throughput": 5795.53, "total_tokens": 9757320} {"current_steps": 14955, "total_steps": 33920, "loss": 0.3839, "lr": 6.859093918405067e-06, "epoch": 8.817806603773585, "percentage": 44.09, "elapsed_time": "0:28:04", "remaining_time": "0:35:35", "throughput": 5795.57, "total_tokens": 9760328} {"current_steps": 14960, "total_steps": 33920, "loss": 0.5049, "lr": 6.856705408179458e-06, "epoch": 8.820754716981131, "percentage": 44.1, "elapsed_time": "0:28:04", "remaining_time": "0:35:35", "throughput": 5795.68, "total_tokens": 9763496} {"current_steps": 14965, "total_steps": 33920, "loss": 0.419, "lr": 6.854316406383093e-06, "epoch": 8.82370283018868, "percentage": 44.12, "elapsed_time": "0:28:05", "remaining_time": "0:35:34", "throughput": 5796.01, "total_tokens": 9767592} {"current_steps": 14970, "total_steps": 33920, "loss": 0.4227, "lr": 6.8519269136484665e-06, "epoch": 8.826650943396226, "percentage": 44.13, "elapsed_time": "0:28:05", "remaining_time": "0:35:33", "throughput": 5796.04, "total_tokens": 9770440} {"current_steps": 14975, "total_steps": 33920, "loss": 0.389, "lr": 6.849536930608208e-06, "epoch": 8.829599056603774, "percentage": 44.15, "elapsed_time": "0:28:06", "remaining_time": "0:35:33", "throughput": 5795.79, "total_tokens": 9772552} {"current_steps": 14980, "total_steps": 33920, "loss": 0.3432, "lr": 6.847146457895078e-06, "epoch": 8.83254716981132, "percentage": 44.16, "elapsed_time": "0:28:06", "remaining_time": "0:35:32", "throughput": 5795.9, "total_tokens": 9775752} {"current_steps": 14985, "total_steps": 33920, "loss": 0.3584, "lr": 6.8447554961419615e-06, "epoch": 8.835495283018869, "percentage": 44.18, "elapsed_time": "0:28:07", "remaining_time": "0:35:31", "throughput": 5795.98, "total_tokens": 9778760} {"current_steps": 14990, "total_steps": 33920, "loss": 0.313, "lr": 6.842364045981876e-06, "epoch": 8.838443396226415, "percentage": 44.19, "elapsed_time": "0:28:07", "remaining_time": "0:35:31", "throughput": 5796.14, "total_tokens": 9782280} {"current_steps": 14995, "total_steps": 33920, "loss": 0.3883, "lr": 6.83997210804797e-06, "epoch": 8.841391509433961, "percentage": 44.21, "elapsed_time": "0:28:08", "remaining_time": "0:35:30", "throughput": 5796.51, "total_tokens": 9786440} {"current_steps": 15000, "total_steps": 33920, "loss": 0.4152, "lr": 6.837579682973519e-06, "epoch": 8.84433962264151, "percentage": 44.22, "elapsed_time": "0:28:08", "remaining_time": "0:35:30", "throughput": 5796.71, "total_tokens": 9789832} {"current_steps": 15005, "total_steps": 33920, "loss": 0.2716, "lr": 6.835186771391926e-06, "epoch": 8.847287735849056, "percentage": 44.24, "elapsed_time": "0:28:09", "remaining_time": "0:35:29", "throughput": 5796.6, "total_tokens": 9792360} {"current_steps": 15010, "total_steps": 33920, "loss": 0.4118, "lr": 6.8327933739367266e-06, "epoch": 8.850235849056604, "percentage": 44.25, "elapsed_time": "0:28:09", "remaining_time": "0:35:28", "throughput": 5796.47, "total_tokens": 9794824} {"current_steps": 15015, "total_steps": 33920, "loss": 0.2922, "lr": 6.830399491241584e-06, "epoch": 8.85318396226415, "percentage": 44.27, "elapsed_time": "0:28:10", "remaining_time": "0:35:28", "throughput": 5796.72, "total_tokens": 9798280} {"current_steps": 15020, "total_steps": 33920, "loss": 0.3109, "lr": 6.828005123940287e-06, "epoch": 8.856132075471699, "percentage": 44.28, "elapsed_time": "0:28:11", "remaining_time": "0:35:27", "throughput": 5797.33, "total_tokens": 9803720} {"current_steps": 15025, "total_steps": 33920, "loss": 0.4407, "lr": 6.825610272666754e-06, "epoch": 8.859080188679245, "percentage": 44.3, "elapsed_time": "0:28:11", "remaining_time": "0:35:27", "throughput": 5797.39, "total_tokens": 9806504} {"current_steps": 15030, "total_steps": 33920, "loss": 0.4007, "lr": 6.823214938055034e-06, "epoch": 8.862028301886792, "percentage": 44.31, "elapsed_time": "0:28:11", "remaining_time": "0:35:26", "throughput": 5797.41, "total_tokens": 9809192} {"current_steps": 15035, "total_steps": 33920, "loss": 0.48, "lr": 6.8208191207393e-06, "epoch": 8.86497641509434, "percentage": 44.32, "elapsed_time": "0:28:12", "remaining_time": "0:35:25", "throughput": 5797.43, "total_tokens": 9812008} {"current_steps": 15040, "total_steps": 33920, "loss": 0.3435, "lr": 6.818422821353859e-06, "epoch": 8.867924528301886, "percentage": 44.34, "elapsed_time": "0:28:13", "remaining_time": "0:35:25", "throughput": 5797.67, "total_tokens": 9815464} {"current_steps": 15045, "total_steps": 33920, "loss": 0.4625, "lr": 6.816026040533139e-06, "epoch": 8.870872641509434, "percentage": 44.35, "elapsed_time": "0:28:13", "remaining_time": "0:35:24", "throughput": 5797.79, "total_tokens": 9818888} {"current_steps": 15050, "total_steps": 33920, "loss": 0.3678, "lr": 6.8136287789116966e-06, "epoch": 8.87382075471698, "percentage": 44.37, "elapsed_time": "0:28:14", "remaining_time": "0:35:24", "throughput": 5797.96, "total_tokens": 9822952} {"current_steps": 15055, "total_steps": 33920, "loss": 0.4056, "lr": 6.81123103712422e-06, "epoch": 8.876768867924529, "percentage": 44.38, "elapsed_time": "0:28:14", "remaining_time": "0:35:23", "throughput": 5798.32, "total_tokens": 9827144} {"current_steps": 15060, "total_steps": 33920, "loss": 0.3675, "lr": 6.808832815805518e-06, "epoch": 8.879716981132075, "percentage": 44.4, "elapsed_time": "0:28:15", "remaining_time": "0:35:23", "throughput": 5798.53, "total_tokens": 9830440} {"current_steps": 15065, "total_steps": 33920, "loss": 0.443, "lr": 6.806434115590534e-06, "epoch": 8.882665094339622, "percentage": 44.41, "elapsed_time": "0:28:15", "remaining_time": "0:35:22", "throughput": 5798.52, "total_tokens": 9833192} {"current_steps": 15070, "total_steps": 33920, "loss": 0.3941, "lr": 6.804034937114332e-06, "epoch": 8.88561320754717, "percentage": 44.43, "elapsed_time": "0:28:16", "remaining_time": "0:35:21", "throughput": 5798.5, "total_tokens": 9835880} {"current_steps": 15075, "total_steps": 33920, "loss": 0.3446, "lr": 6.8016352810121064e-06, "epoch": 8.888561320754716, "percentage": 44.44, "elapsed_time": "0:28:16", "remaining_time": "0:35:21", "throughput": 5798.27, "total_tokens": 9838248} {"current_steps": 15080, "total_steps": 33920, "loss": 0.4545, "lr": 6.799235147919176e-06, "epoch": 8.891509433962264, "percentage": 44.46, "elapsed_time": "0:28:17", "remaining_time": "0:35:20", "throughput": 5798.42, "total_tokens": 9841480} {"current_steps": 15085, "total_steps": 33920, "loss": 0.4262, "lr": 6.796834538470985e-06, "epoch": 8.89445754716981, "percentage": 44.47, "elapsed_time": "0:28:17", "remaining_time": "0:35:19", "throughput": 5798.46, "total_tokens": 9844392} {"current_steps": 15090, "total_steps": 33920, "loss": 0.4196, "lr": 6.794433453303106e-06, "epoch": 8.897405660377359, "percentage": 44.49, "elapsed_time": "0:28:18", "remaining_time": "0:35:19", "throughput": 5798.47, "total_tokens": 9847848} {"current_steps": 15095, "total_steps": 33920, "loss": 0.4999, "lr": 6.792031893051238e-06, "epoch": 8.900353773584905, "percentage": 44.5, "elapsed_time": "0:28:18", "remaining_time": "0:35:18", "throughput": 5798.53, "total_tokens": 9851432} {"current_steps": 15100, "total_steps": 33920, "loss": 0.3777, "lr": 6.789629858351201e-06, "epoch": 8.903301886792454, "percentage": 44.52, "elapsed_time": "0:28:19", "remaining_time": "0:35:18", "throughput": 5798.77, "total_tokens": 9854984} {"current_steps": 15105, "total_steps": 33920, "loss": 0.4076, "lr": 6.787227349838946e-06, "epoch": 8.90625, "percentage": 44.53, "elapsed_time": "0:28:19", "remaining_time": "0:35:17", "throughput": 5798.81, "total_tokens": 9857800} {"current_steps": 15110, "total_steps": 33920, "loss": 0.3255, "lr": 6.784824368150548e-06, "epoch": 8.909198113207546, "percentage": 44.55, "elapsed_time": "0:28:20", "remaining_time": "0:35:16", "throughput": 5798.62, "total_tokens": 9860296} {"current_steps": 15115, "total_steps": 33920, "loss": 0.3604, "lr": 6.7824209139222076e-06, "epoch": 8.912146226415095, "percentage": 44.56, "elapsed_time": "0:28:20", "remaining_time": "0:35:16", "throughput": 5798.61, "total_tokens": 9862984} {"current_steps": 15120, "total_steps": 33920, "loss": 0.3428, "lr": 6.780016987790248e-06, "epoch": 8.915094339622641, "percentage": 44.58, "elapsed_time": "0:28:21", "remaining_time": "0:35:15", "throughput": 5798.65, "total_tokens": 9866120} {"current_steps": 15125, "total_steps": 33920, "loss": 0.4906, "lr": 6.7776125903911194e-06, "epoch": 8.91804245283019, "percentage": 44.59, "elapsed_time": "0:28:22", "remaining_time": "0:35:15", "throughput": 5798.98, "total_tokens": 9870120} {"current_steps": 15130, "total_steps": 33920, "loss": 0.5517, "lr": 6.775207722361396e-06, "epoch": 8.920990566037736, "percentage": 44.6, "elapsed_time": "0:28:22", "remaining_time": "0:35:14", "throughput": 5798.84, "total_tokens": 9872808} {"current_steps": 15135, "total_steps": 33920, "loss": 0.4352, "lr": 6.772802384337778e-06, "epoch": 8.923938679245284, "percentage": 44.62, "elapsed_time": "0:28:23", "remaining_time": "0:35:13", "throughput": 5799.04, "total_tokens": 9876456} {"current_steps": 15140, "total_steps": 33920, "loss": 0.2946, "lr": 6.770396576957088e-06, "epoch": 8.92688679245283, "percentage": 44.63, "elapsed_time": "0:28:23", "remaining_time": "0:35:13", "throughput": 5798.81, "total_tokens": 9878728} {"current_steps": 15145, "total_steps": 33920, "loss": 0.5341, "lr": 6.767990300856274e-06, "epoch": 8.929834905660378, "percentage": 44.65, "elapsed_time": "0:28:24", "remaining_time": "0:35:12", "throughput": 5798.81, "total_tokens": 9881704} {"current_steps": 15150, "total_steps": 33920, "loss": 0.3521, "lr": 6.765583556672408e-06, "epoch": 8.932783018867925, "percentage": 44.66, "elapsed_time": "0:28:24", "remaining_time": "0:35:11", "throughput": 5798.78, "total_tokens": 9884392} {"current_steps": 15155, "total_steps": 33920, "loss": 0.2488, "lr": 6.763176345042687e-06, "epoch": 8.935731132075471, "percentage": 44.68, "elapsed_time": "0:28:25", "remaining_time": "0:35:11", "throughput": 5798.93, "total_tokens": 9887528} {"current_steps": 15160, "total_steps": 33920, "loss": 0.6035, "lr": 6.760768666604429e-06, "epoch": 8.93867924528302, "percentage": 44.69, "elapsed_time": "0:28:25", "remaining_time": "0:35:10", "throughput": 5798.91, "total_tokens": 9890376} {"current_steps": 15165, "total_steps": 33920, "loss": 0.4492, "lr": 6.758360521995079e-06, "epoch": 8.941627358490566, "percentage": 44.71, "elapsed_time": "0:28:26", "remaining_time": "0:35:09", "throughput": 5798.9, "total_tokens": 9893320} {"current_steps": 15170, "total_steps": 33920, "loss": 0.3756, "lr": 6.755951911852202e-06, "epoch": 8.944575471698114, "percentage": 44.72, "elapsed_time": "0:28:26", "remaining_time": "0:35:09", "throughput": 5798.98, "total_tokens": 9896232} {"current_steps": 15175, "total_steps": 33920, "loss": 0.4015, "lr": 6.7535428368134885e-06, "epoch": 8.94752358490566, "percentage": 44.74, "elapsed_time": "0:28:27", "remaining_time": "0:35:08", "throughput": 5799.06, "total_tokens": 9899464} {"current_steps": 15180, "total_steps": 33920, "loss": 0.5217, "lr": 6.751133297516752e-06, "epoch": 8.950471698113208, "percentage": 44.75, "elapsed_time": "0:28:27", "remaining_time": "0:35:08", "throughput": 5799.2, "total_tokens": 9902728} {"current_steps": 15185, "total_steps": 33920, "loss": 0.35, "lr": 6.748723294599928e-06, "epoch": 8.953419811320755, "percentage": 44.77, "elapsed_time": "0:28:28", "remaining_time": "0:35:07", "throughput": 5799.37, "total_tokens": 9906280} {"current_steps": 15190, "total_steps": 33920, "loss": 0.4208, "lr": 6.746312828701075e-06, "epoch": 8.956367924528301, "percentage": 44.78, "elapsed_time": "0:28:28", "remaining_time": "0:35:06", "throughput": 5799.62, "total_tokens": 9909960} {"current_steps": 15195, "total_steps": 33920, "loss": 0.454, "lr": 6.743901900458374e-06, "epoch": 8.95931603773585, "percentage": 44.8, "elapsed_time": "0:28:29", "remaining_time": "0:35:06", "throughput": 5799.59, "total_tokens": 9912744} {"current_steps": 15200, "total_steps": 33920, "loss": 0.3991, "lr": 6.741490510510129e-06, "epoch": 8.962264150943396, "percentage": 44.81, "elapsed_time": "0:28:29", "remaining_time": "0:35:05", "throughput": 5799.74, "total_tokens": 9915976} {"current_steps": 15205, "total_steps": 33920, "loss": 0.2997, "lr": 6.7390786594947665e-06, "epoch": 8.965212264150944, "percentage": 44.83, "elapsed_time": "0:28:30", "remaining_time": "0:35:05", "throughput": 5799.6, "total_tokens": 9918536} {"current_steps": 15210, "total_steps": 33920, "loss": 0.453, "lr": 6.7366663480508335e-06, "epoch": 8.96816037735849, "percentage": 44.84, "elapsed_time": "0:28:30", "remaining_time": "0:35:04", "throughput": 5799.54, "total_tokens": 9921416} {"current_steps": 15215, "total_steps": 33920, "loss": 0.3343, "lr": 6.734253576817002e-06, "epoch": 8.971108490566039, "percentage": 44.86, "elapsed_time": "0:28:31", "remaining_time": "0:35:03", "throughput": 5799.87, "total_tokens": 9925544} {"current_steps": 15220, "total_steps": 33920, "loss": 0.3874, "lr": 6.731840346432061e-06, "epoch": 8.974056603773585, "percentage": 44.87, "elapsed_time": "0:28:31", "remaining_time": "0:35:03", "throughput": 5800.08, "total_tokens": 9928936} {"current_steps": 15225, "total_steps": 33920, "loss": 0.4687, "lr": 6.729426657534922e-06, "epoch": 8.977004716981131, "percentage": 44.89, "elapsed_time": "0:28:32", "remaining_time": "0:35:02", "throughput": 5800.21, "total_tokens": 9931912} {"current_steps": 15230, "total_steps": 33920, "loss": 0.4709, "lr": 6.727012510764624e-06, "epoch": 8.97995283018868, "percentage": 44.9, "elapsed_time": "0:28:32", "remaining_time": "0:35:01", "throughput": 5800.36, "total_tokens": 9934984} {"current_steps": 15235, "total_steps": 33920, "loss": 0.4471, "lr": 6.724597906760322e-06, "epoch": 8.982900943396226, "percentage": 44.91, "elapsed_time": "0:28:33", "remaining_time": "0:35:01", "throughput": 5800.15, "total_tokens": 9937800} {"current_steps": 15240, "total_steps": 33920, "loss": 0.5142, "lr": 6.722182846161289e-06, "epoch": 8.985849056603774, "percentage": 44.93, "elapsed_time": "0:28:33", "remaining_time": "0:35:00", "throughput": 5800.26, "total_tokens": 9940712} {"current_steps": 15245, "total_steps": 33920, "loss": 0.4572, "lr": 6.719767329606926e-06, "epoch": 8.98879716981132, "percentage": 44.94, "elapsed_time": "0:28:34", "remaining_time": "0:35:00", "throughput": 5800.56, "total_tokens": 9944584} {"current_steps": 15250, "total_steps": 33920, "loss": 0.5779, "lr": 6.717351357736751e-06, "epoch": 8.991745283018869, "percentage": 44.96, "elapsed_time": "0:28:34", "remaining_time": "0:34:59", "throughput": 5800.6, "total_tokens": 9947368} {"current_steps": 15255, "total_steps": 33920, "loss": 0.3254, "lr": 6.7149349311904025e-06, "epoch": 8.994693396226415, "percentage": 44.97, "elapsed_time": "0:28:35", "remaining_time": "0:34:58", "throughput": 5800.56, "total_tokens": 9950088} {"current_steps": 15260, "total_steps": 33920, "loss": 0.3661, "lr": 6.712518050607642e-06, "epoch": 8.997641509433961, "percentage": 44.99, "elapsed_time": "0:28:35", "remaining_time": "0:34:58", "throughput": 5800.6, "total_tokens": 9953096} {"current_steps": 15265, "total_steps": 33920, "loss": 0.3108, "lr": 6.710100716628345e-06, "epoch": 9.00058962264151, "percentage": 45.0, "elapsed_time": "0:28:36", "remaining_time": "0:34:57", "throughput": 5799.31, "total_tokens": 9954992} {"current_steps": 15270, "total_steps": 33920, "loss": 0.4337, "lr": 6.707682929892513e-06, "epoch": 9.003537735849056, "percentage": 45.02, "elapsed_time": "0:28:37", "remaining_time": "0:34:57", "throughput": 5799.23, "total_tokens": 9957808} {"current_steps": 15275, "total_steps": 33920, "loss": 0.3454, "lr": 6.705264691040266e-06, "epoch": 9.006485849056604, "percentage": 45.03, "elapsed_time": "0:28:37", "remaining_time": "0:34:56", "throughput": 5799.39, "total_tokens": 9961520} {"current_steps": 15280, "total_steps": 33920, "loss": 0.3543, "lr": 6.7028460007118435e-06, "epoch": 9.00943396226415, "percentage": 45.05, "elapsed_time": "0:28:38", "remaining_time": "0:34:55", "throughput": 5799.41, "total_tokens": 9964144} {"current_steps": 15285, "total_steps": 33920, "loss": 0.2855, "lr": 6.700426859547602e-06, "epoch": 9.012382075471699, "percentage": 45.06, "elapsed_time": "0:28:38", "remaining_time": "0:34:55", "throughput": 5799.47, "total_tokens": 9967056} {"current_steps": 15290, "total_steps": 33920, "loss": 0.3572, "lr": 6.6980072681880224e-06, "epoch": 9.015330188679245, "percentage": 45.08, "elapsed_time": "0:28:39", "remaining_time": "0:34:54", "throughput": 5799.72, "total_tokens": 9970800} {"current_steps": 15295, "total_steps": 33920, "loss": 0.2975, "lr": 6.695587227273699e-06, "epoch": 9.018278301886792, "percentage": 45.09, "elapsed_time": "0:28:39", "remaining_time": "0:34:54", "throughput": 5799.69, "total_tokens": 9973392} {"current_steps": 15300, "total_steps": 33920, "loss": 0.3454, "lr": 6.69316673744535e-06, "epoch": 9.02122641509434, "percentage": 45.11, "elapsed_time": "0:28:40", "remaining_time": "0:34:53", "throughput": 5799.71, "total_tokens": 9976176} {"current_steps": 15305, "total_steps": 33920, "loss": 0.4048, "lr": 6.6907457993438115e-06, "epoch": 9.024174528301886, "percentage": 45.12, "elapsed_time": "0:28:40", "remaining_time": "0:34:52", "throughput": 5799.63, "total_tokens": 9979440} {"current_steps": 15310, "total_steps": 33920, "loss": 0.4487, "lr": 6.688324413610036e-06, "epoch": 9.027122641509434, "percentage": 45.14, "elapsed_time": "0:28:41", "remaining_time": "0:34:52", "throughput": 5799.68, "total_tokens": 9982192} {"current_steps": 15315, "total_steps": 33920, "loss": 0.2786, "lr": 6.685902580885094e-06, "epoch": 9.03007075471698, "percentage": 45.15, "elapsed_time": "0:28:41", "remaining_time": "0:34:51", "throughput": 5799.7, "total_tokens": 9984848} {"current_steps": 15320, "total_steps": 33920, "loss": 0.3064, "lr": 6.6834803018101794e-06, "epoch": 9.033018867924529, "percentage": 45.17, "elapsed_time": "0:28:42", "remaining_time": "0:34:50", "throughput": 5799.7, "total_tokens": 9987568} {"current_steps": 15325, "total_steps": 33920, "loss": 0.3202, "lr": 6.681057577026599e-06, "epoch": 9.035966981132075, "percentage": 45.18, "elapsed_time": "0:28:42", "remaining_time": "0:34:50", "throughput": 5799.81, "total_tokens": 9990736} {"current_steps": 15330, "total_steps": 33920, "loss": 0.4524, "lr": 6.6786344071757795e-06, "epoch": 9.038915094339623, "percentage": 45.19, "elapsed_time": "0:28:43", "remaining_time": "0:34:49", "throughput": 5799.99, "total_tokens": 9994000} {"current_steps": 15335, "total_steps": 33920, "loss": 0.3168, "lr": 6.676210792899267e-06, "epoch": 9.04186320754717, "percentage": 45.21, "elapsed_time": "0:28:43", "remaining_time": "0:34:48", "throughput": 5799.78, "total_tokens": 9996272} {"current_steps": 15340, "total_steps": 33920, "loss": 0.3955, "lr": 6.6737867348387235e-06, "epoch": 9.044811320754716, "percentage": 45.22, "elapsed_time": "0:28:44", "remaining_time": "0:34:48", "throughput": 5799.92, "total_tokens": 9999632} {"current_steps": 15345, "total_steps": 33920, "loss": 0.3593, "lr": 6.671362233635926e-06, "epoch": 9.047759433962264, "percentage": 45.24, "elapsed_time": "0:28:44", "remaining_time": "0:34:47", "throughput": 5799.99, "total_tokens": 10002512} {"current_steps": 15350, "total_steps": 33920, "loss": 0.3448, "lr": 6.668937289932775e-06, "epoch": 9.05070754716981, "percentage": 45.25, "elapsed_time": "0:28:45", "remaining_time": "0:34:46", "throughput": 5799.87, "total_tokens": 10005136} {"current_steps": 15355, "total_steps": 33920, "loss": 0.2999, "lr": 6.666511904371285e-06, "epoch": 9.053655660377359, "percentage": 45.27, "elapsed_time": "0:28:45", "remaining_time": "0:34:46", "throughput": 5799.97, "total_tokens": 10008336} {"current_steps": 15360, "total_steps": 33920, "loss": 0.2692, "lr": 6.664086077593586e-06, "epoch": 9.056603773584905, "percentage": 45.28, "elapsed_time": "0:28:46", "remaining_time": "0:34:45", "throughput": 5800.04, "total_tokens": 10011248} {"current_steps": 15365, "total_steps": 33920, "loss": 0.5523, "lr": 6.661659810241924e-06, "epoch": 9.059551886792454, "percentage": 45.3, "elapsed_time": "0:28:46", "remaining_time": "0:34:45", "throughput": 5800.05, "total_tokens": 10014448} {"current_steps": 15370, "total_steps": 33920, "loss": 0.3496, "lr": 6.659233102958667e-06, "epoch": 9.0625, "percentage": 45.31, "elapsed_time": "0:28:47", "remaining_time": "0:34:44", "throughput": 5800.13, "total_tokens": 10017616} {"current_steps": 15375, "total_steps": 33920, "loss": 0.3469, "lr": 6.6568059563862965e-06, "epoch": 9.065448113207546, "percentage": 45.33, "elapsed_time": "0:28:47", "remaining_time": "0:34:43", "throughput": 5800.11, "total_tokens": 10020432} {"current_steps": 15380, "total_steps": 33920, "loss": 0.385, "lr": 6.654378371167407e-06, "epoch": 9.068396226415095, "percentage": 45.34, "elapsed_time": "0:28:48", "remaining_time": "0:34:43", "throughput": 5800.37, "total_tokens": 10024624} {"current_steps": 15385, "total_steps": 33920, "loss": 0.3473, "lr": 6.651950347944715e-06, "epoch": 9.071344339622641, "percentage": 45.36, "elapsed_time": "0:28:48", "remaining_time": "0:34:42", "throughput": 5800.73, "total_tokens": 10029040} {"current_steps": 15390, "total_steps": 33920, "loss": 0.3784, "lr": 6.649521887361048e-06, "epoch": 9.07429245283019, "percentage": 45.37, "elapsed_time": "0:28:49", "remaining_time": "0:34:42", "throughput": 5801.11, "total_tokens": 10034064} {"current_steps": 15395, "total_steps": 33920, "loss": 0.4726, "lr": 6.647092990059352e-06, "epoch": 9.077240566037736, "percentage": 45.39, "elapsed_time": "0:28:50", "remaining_time": "0:34:41", "throughput": 5801.14, "total_tokens": 10037200} {"current_steps": 15400, "total_steps": 33920, "loss": 0.4033, "lr": 6.644663656682689e-06, "epoch": 9.080188679245284, "percentage": 45.4, "elapsed_time": "0:28:50", "remaining_time": "0:34:41", "throughput": 5801.21, "total_tokens": 10040368} {"current_steps": 15405, "total_steps": 33920, "loss": 0.3821, "lr": 6.642233887874234e-06, "epoch": 9.08313679245283, "percentage": 45.42, "elapsed_time": "0:28:51", "remaining_time": "0:34:40", "throughput": 5801.36, "total_tokens": 10044208} {"current_steps": 15410, "total_steps": 33920, "loss": 0.4293, "lr": 6.639803684277279e-06, "epoch": 9.086084905660377, "percentage": 45.43, "elapsed_time": "0:28:51", "remaining_time": "0:34:40", "throughput": 5801.38, "total_tokens": 10047120} {"current_steps": 15415, "total_steps": 33920, "loss": 0.3601, "lr": 6.637373046535233e-06, "epoch": 9.089033018867925, "percentage": 45.45, "elapsed_time": "0:28:52", "remaining_time": "0:34:39", "throughput": 5801.39, "total_tokens": 10050288} {"current_steps": 15420, "total_steps": 33920, "loss": 0.4904, "lr": 6.634941975291617e-06, "epoch": 9.091981132075471, "percentage": 45.46, "elapsed_time": "0:28:53", "remaining_time": "0:34:39", "throughput": 5801.6, "total_tokens": 10054480} {"current_steps": 15425, "total_steps": 33920, "loss": 0.3969, "lr": 6.632510471190065e-06, "epoch": 9.09492924528302, "percentage": 45.47, "elapsed_time": "0:28:53", "remaining_time": "0:34:38", "throughput": 5801.6, "total_tokens": 10057616} {"current_steps": 15430, "total_steps": 33920, "loss": 0.3054, "lr": 6.630078534874332e-06, "epoch": 9.097877358490566, "percentage": 45.49, "elapsed_time": "0:28:54", "remaining_time": "0:34:37", "throughput": 5801.53, "total_tokens": 10060144} {"current_steps": 15435, "total_steps": 33920, "loss": 0.433, "lr": 6.62764616698828e-06, "epoch": 9.100825471698114, "percentage": 45.5, "elapsed_time": "0:28:54", "remaining_time": "0:34:37", "throughput": 5801.49, "total_tokens": 10062928} {"current_steps": 15440, "total_steps": 33920, "loss": 0.3988, "lr": 6.625213368175889e-06, "epoch": 9.10377358490566, "percentage": 45.52, "elapsed_time": "0:28:55", "remaining_time": "0:34:36", "throughput": 5801.55, "total_tokens": 10065840} {"current_steps": 15445, "total_steps": 33920, "loss": 0.3401, "lr": 6.622780139081256e-06, "epoch": 9.106721698113208, "percentage": 45.53, "elapsed_time": "0:28:55", "remaining_time": "0:34:36", "throughput": 5801.65, "total_tokens": 10068912} {"current_steps": 15450, "total_steps": 33920, "loss": 0.4874, "lr": 6.620346480348589e-06, "epoch": 9.109669811320755, "percentage": 45.55, "elapsed_time": "0:28:56", "remaining_time": "0:34:35", "throughput": 5801.55, "total_tokens": 10071728} {"current_steps": 15455, "total_steps": 33920, "loss": 0.3906, "lr": 6.617912392622206e-06, "epoch": 9.112617924528301, "percentage": 45.56, "elapsed_time": "0:28:56", "remaining_time": "0:34:34", "throughput": 5801.55, "total_tokens": 10074672} {"current_steps": 15460, "total_steps": 33920, "loss": 0.2949, "lr": 6.615477876546544e-06, "epoch": 9.11556603773585, "percentage": 45.58, "elapsed_time": "0:28:57", "remaining_time": "0:34:34", "throughput": 5801.76, "total_tokens": 10078160} {"current_steps": 15465, "total_steps": 33920, "loss": 0.3605, "lr": 6.6130429327661535e-06, "epoch": 9.118514150943396, "percentage": 45.59, "elapsed_time": "0:28:57", "remaining_time": "0:34:33", "throughput": 5801.75, "total_tokens": 10080912} {"current_steps": 15470, "total_steps": 33920, "loss": 0.3987, "lr": 6.610607561925694e-06, "epoch": 9.121462264150944, "percentage": 45.61, "elapsed_time": "0:28:58", "remaining_time": "0:34:32", "throughput": 5801.8, "total_tokens": 10084048} {"current_steps": 15475, "total_steps": 33920, "loss": 0.36, "lr": 6.608171764669941e-06, "epoch": 9.12441037735849, "percentage": 45.62, "elapsed_time": "0:28:58", "remaining_time": "0:34:32", "throughput": 5801.95, "total_tokens": 10087312} {"current_steps": 15480, "total_steps": 33920, "loss": 0.4232, "lr": 6.605735541643783e-06, "epoch": 9.127358490566039, "percentage": 45.64, "elapsed_time": "0:28:59", "remaining_time": "0:34:31", "throughput": 5802.22, "total_tokens": 10091184} {"current_steps": 15485, "total_steps": 33920, "loss": 0.3992, "lr": 6.603298893492219e-06, "epoch": 9.130306603773585, "percentage": 45.65, "elapsed_time": "0:28:59", "remaining_time": "0:34:31", "throughput": 5802.67, "total_tokens": 10096400} {"current_steps": 15490, "total_steps": 33920, "loss": 0.38, "lr": 6.6008618208603625e-06, "epoch": 9.133254716981131, "percentage": 45.67, "elapsed_time": "0:29:00", "remaining_time": "0:34:30", "throughput": 5802.67, "total_tokens": 10099216} {"current_steps": 15495, "total_steps": 33920, "loss": 0.3689, "lr": 6.598424324393442e-06, "epoch": 9.13620283018868, "percentage": 45.68, "elapsed_time": "0:29:00", "remaining_time": "0:34:30", "throughput": 5802.74, "total_tokens": 10102224} {"current_steps": 15500, "total_steps": 33920, "loss": 0.4944, "lr": 6.595986404736792e-06, "epoch": 9.139150943396226, "percentage": 45.7, "elapsed_time": "0:29:01", "remaining_time": "0:34:29", "throughput": 5802.97, "total_tokens": 10105904} {"current_steps": 15505, "total_steps": 33920, "loss": 0.3883, "lr": 6.5935480625358615e-06, "epoch": 9.142099056603774, "percentage": 45.71, "elapsed_time": "0:29:02", "remaining_time": "0:34:28", "throughput": 5803.05, "total_tokens": 10108976} {"current_steps": 15510, "total_steps": 33920, "loss": 0.3664, "lr": 6.591109298436216e-06, "epoch": 9.14504716981132, "percentage": 45.73, "elapsed_time": "0:29:02", "remaining_time": "0:34:28", "throughput": 5802.96, "total_tokens": 10112048} {"current_steps": 15515, "total_steps": 33920, "loss": 0.336, "lr": 6.5886701130835255e-06, "epoch": 9.147995283018869, "percentage": 45.74, "elapsed_time": "0:29:03", "remaining_time": "0:34:27", "throughput": 5803.07, "total_tokens": 10115344} {"current_steps": 15520, "total_steps": 33920, "loss": 0.2463, "lr": 6.586230507123574e-06, "epoch": 9.150943396226415, "percentage": 45.75, "elapsed_time": "0:29:03", "remaining_time": "0:34:27", "throughput": 5803.06, "total_tokens": 10118288} {"current_steps": 15525, "total_steps": 33920, "loss": 0.4199, "lr": 6.583790481202261e-06, "epoch": 9.153891509433961, "percentage": 45.77, "elapsed_time": "0:29:04", "remaining_time": "0:34:26", "throughput": 5803.21, "total_tokens": 10122000} {"current_steps": 15530, "total_steps": 33920, "loss": 0.4549, "lr": 6.5813500359655925e-06, "epoch": 9.15683962264151, "percentage": 45.78, "elapsed_time": "0:29:04", "remaining_time": "0:34:26", "throughput": 5803.18, "total_tokens": 10124976} {"current_steps": 15535, "total_steps": 33920, "loss": 0.3342, "lr": 6.578909172059687e-06, "epoch": 9.159787735849056, "percentage": 45.8, "elapsed_time": "0:29:05", "remaining_time": "0:34:25", "throughput": 5803.52, "total_tokens": 10129424} {"current_steps": 15540, "total_steps": 33920, "loss": 0.5142, "lr": 6.576467890130772e-06, "epoch": 9.162735849056604, "percentage": 45.81, "elapsed_time": "0:29:05", "remaining_time": "0:34:24", "throughput": 5803.54, "total_tokens": 10132336} {"current_steps": 15545, "total_steps": 33920, "loss": 0.3993, "lr": 6.574026190825191e-06, "epoch": 9.16568396226415, "percentage": 45.83, "elapsed_time": "0:29:06", "remaining_time": "0:34:24", "throughput": 5803.64, "total_tokens": 10135824} {"current_steps": 15550, "total_steps": 33920, "loss": 0.584, "lr": 6.57158407478939e-06, "epoch": 9.168632075471699, "percentage": 45.84, "elapsed_time": "0:29:06", "remaining_time": "0:34:23", "throughput": 5803.79, "total_tokens": 10139120} {"current_steps": 15555, "total_steps": 33920, "loss": 0.3488, "lr": 6.569141542669935e-06, "epoch": 9.171580188679245, "percentage": 45.86, "elapsed_time": "0:29:07", "remaining_time": "0:34:23", "throughput": 5803.64, "total_tokens": 10141584} {"current_steps": 15560, "total_steps": 33920, "loss": 0.4841, "lr": 6.566698595113492e-06, "epoch": 9.174528301886792, "percentage": 45.87, "elapsed_time": "0:29:07", "remaining_time": "0:34:22", "throughput": 5803.42, "total_tokens": 10144048} {"current_steps": 15565, "total_steps": 33920, "loss": 0.4002, "lr": 6.564255232766843e-06, "epoch": 9.17747641509434, "percentage": 45.89, "elapsed_time": "0:29:08", "remaining_time": "0:34:21", "throughput": 5803.63, "total_tokens": 10147568} {"current_steps": 15570, "total_steps": 33920, "loss": 0.3668, "lr": 6.561811456276881e-06, "epoch": 9.180424528301886, "percentage": 45.9, "elapsed_time": "0:29:09", "remaining_time": "0:34:21", "throughput": 5803.7, "total_tokens": 10151088} {"current_steps": 15575, "total_steps": 33920, "loss": 0.4924, "lr": 6.559367266290605e-06, "epoch": 9.183372641509434, "percentage": 45.92, "elapsed_time": "0:29:09", "remaining_time": "0:34:20", "throughput": 5803.85, "total_tokens": 10154352} {"current_steps": 15580, "total_steps": 33920, "loss": 0.4176, "lr": 6.556922663455123e-06, "epoch": 9.18632075471698, "percentage": 45.93, "elapsed_time": "0:29:10", "remaining_time": "0:34:20", "throughput": 5804.07, "total_tokens": 10157776} {"current_steps": 15585, "total_steps": 33920, "loss": 0.2943, "lr": 6.554477648417657e-06, "epoch": 9.189268867924529, "percentage": 45.95, "elapsed_time": "0:29:10", "remaining_time": "0:34:19", "throughput": 5803.99, "total_tokens": 10160528} {"current_steps": 15590, "total_steps": 33920, "loss": 0.439, "lr": 6.552032221825535e-06, "epoch": 9.192216981132075, "percentage": 45.96, "elapsed_time": "0:29:11", "remaining_time": "0:34:18", "throughput": 5804.22, "total_tokens": 10164080} {"current_steps": 15595, "total_steps": 33920, "loss": 0.3956, "lr": 6.549586384326192e-06, "epoch": 9.195165094339623, "percentage": 45.98, "elapsed_time": "0:29:11", "remaining_time": "0:34:18", "throughput": 5804.3, "total_tokens": 10167600} {"current_steps": 15600, "total_steps": 33920, "loss": 0.3982, "lr": 6.547140136567176e-06, "epoch": 9.19811320754717, "percentage": 45.99, "elapsed_time": "0:29:12", "remaining_time": "0:34:17", "throughput": 5804.32, "total_tokens": 10170512} {"current_steps": 15605, "total_steps": 33920, "loss": 0.3391, "lr": 6.544693479196142e-06, "epoch": 9.201061320754716, "percentage": 46.01, "elapsed_time": "0:29:12", "remaining_time": "0:34:17", "throughput": 5804.65, "total_tokens": 10174928} {"current_steps": 15610, "total_steps": 33920, "loss": 0.44, "lr": 6.542246412860851e-06, "epoch": 9.204009433962264, "percentage": 46.02, "elapsed_time": "0:29:13", "remaining_time": "0:34:16", "throughput": 5804.46, "total_tokens": 10177552} {"current_steps": 15615, "total_steps": 33920, "loss": 0.5209, "lr": 6.5397989382091754e-06, "epoch": 9.20695754716981, "percentage": 46.03, "elapsed_time": "0:29:14", "remaining_time": "0:34:16", "throughput": 5804.76, "total_tokens": 10181840} {"current_steps": 15620, "total_steps": 33920, "loss": 0.2597, "lr": 6.537351055889096e-06, "epoch": 9.209905660377359, "percentage": 46.05, "elapsed_time": "0:29:14", "remaining_time": "0:34:15", "throughput": 5804.83, "total_tokens": 10184880} {"current_steps": 15625, "total_steps": 33920, "loss": 0.3355, "lr": 6.534902766548698e-06, "epoch": 9.212853773584905, "percentage": 46.06, "elapsed_time": "0:29:15", "remaining_time": "0:34:14", "throughput": 5805.0, "total_tokens": 10188272} {"current_steps": 15630, "total_steps": 33920, "loss": 0.3663, "lr": 6.532454070836176e-06, "epoch": 9.215801886792454, "percentage": 46.08, "elapsed_time": "0:29:15", "remaining_time": "0:34:14", "throughput": 5804.87, "total_tokens": 10190704} {"current_steps": 15635, "total_steps": 33920, "loss": 0.3209, "lr": 6.530004969399836e-06, "epoch": 9.21875, "percentage": 46.09, "elapsed_time": "0:29:16", "remaining_time": "0:34:13", "throughput": 5805.06, "total_tokens": 10194096} {"current_steps": 15640, "total_steps": 33920, "loss": 0.2777, "lr": 6.5275554628880865e-06, "epoch": 9.221698113207546, "percentage": 46.11, "elapsed_time": "0:29:16", "remaining_time": "0:34:13", "throughput": 5805.15, "total_tokens": 10197616} {"current_steps": 15645, "total_steps": 33920, "loss": 0.4667, "lr": 6.525105551949444e-06, "epoch": 9.224646226415095, "percentage": 46.12, "elapsed_time": "0:29:17", "remaining_time": "0:34:12", "throughput": 5805.29, "total_tokens": 10201392} {"current_steps": 15650, "total_steps": 33920, "loss": 0.4882, "lr": 6.522655237232535e-06, "epoch": 9.227594339622641, "percentage": 46.14, "elapsed_time": "0:29:17", "remaining_time": "0:34:12", "throughput": 5805.29, "total_tokens": 10204304} {"current_steps": 15655, "total_steps": 33920, "loss": 0.3778, "lr": 6.5202045193860885e-06, "epoch": 9.23054245283019, "percentage": 46.15, "elapsed_time": "0:29:18", "remaining_time": "0:34:11", "throughput": 5805.31, "total_tokens": 10207280} {"current_steps": 15660, "total_steps": 33920, "loss": 0.3208, "lr": 6.517753399058944e-06, "epoch": 9.233490566037736, "percentage": 46.17, "elapsed_time": "0:29:18", "remaining_time": "0:34:10", "throughput": 5805.25, "total_tokens": 10209904} {"current_steps": 15665, "total_steps": 33920, "loss": 0.6337, "lr": 6.515301876900047e-06, "epoch": 9.236438679245284, "percentage": 46.18, "elapsed_time": "0:29:19", "remaining_time": "0:34:10", "throughput": 5805.38, "total_tokens": 10213360} {"current_steps": 15670, "total_steps": 33920, "loss": 0.4203, "lr": 6.512849953558445e-06, "epoch": 9.23938679245283, "percentage": 46.2, "elapsed_time": "0:29:19", "remaining_time": "0:34:09", "throughput": 5805.4, "total_tokens": 10216496} {"current_steps": 15675, "total_steps": 33920, "loss": 0.3568, "lr": 6.510397629683301e-06, "epoch": 9.242334905660377, "percentage": 46.21, "elapsed_time": "0:29:20", "remaining_time": "0:34:08", "throughput": 5805.6, "total_tokens": 10219984} {"current_steps": 15680, "total_steps": 33920, "loss": 0.3507, "lr": 6.507944905923872e-06, "epoch": 9.245283018867925, "percentage": 46.23, "elapsed_time": "0:29:20", "remaining_time": "0:34:08", "throughput": 5805.78, "total_tokens": 10223280} {"current_steps": 15685, "total_steps": 33920, "loss": 0.3952, "lr": 6.505491782929531e-06, "epoch": 9.248231132075471, "percentage": 46.24, "elapsed_time": "0:29:21", "remaining_time": "0:34:07", "throughput": 5805.87, "total_tokens": 10226640} {"current_steps": 15690, "total_steps": 33920, "loss": 0.3722, "lr": 6.5030382613497535e-06, "epoch": 9.25117924528302, "percentage": 46.26, "elapsed_time": "0:29:22", "remaining_time": "0:34:07", "throughput": 5806.04, "total_tokens": 10230288} {"current_steps": 15695, "total_steps": 33920, "loss": 0.4178, "lr": 6.500584341834119e-06, "epoch": 9.254127358490566, "percentage": 46.27, "elapsed_time": "0:29:22", "remaining_time": "0:34:06", "throughput": 5806.04, "total_tokens": 10233136} {"current_steps": 15700, "total_steps": 33920, "loss": 0.3248, "lr": 6.498130025032312e-06, "epoch": 9.257075471698114, "percentage": 46.29, "elapsed_time": "0:29:23", "remaining_time": "0:34:06", "throughput": 5805.81, "total_tokens": 10235792} {"current_steps": 15705, "total_steps": 33920, "loss": 0.3616, "lr": 6.495675311594123e-06, "epoch": 9.26002358490566, "percentage": 46.3, "elapsed_time": "0:29:23", "remaining_time": "0:34:05", "throughput": 5805.93, "total_tokens": 10239088} {"current_steps": 15710, "total_steps": 33920, "loss": 0.3967, "lr": 6.493220202169452e-06, "epoch": 9.262971698113208, "percentage": 46.31, "elapsed_time": "0:29:24", "remaining_time": "0:34:04", "throughput": 5806.1, "total_tokens": 10242320} {"current_steps": 15715, "total_steps": 33920, "loss": 0.3508, "lr": 6.490764697408295e-06, "epoch": 9.265919811320755, "percentage": 46.33, "elapsed_time": "0:29:24", "remaining_time": "0:34:04", "throughput": 5806.17, "total_tokens": 10246160} {"current_steps": 15720, "total_steps": 33920, "loss": 0.2591, "lr": 6.48830879796076e-06, "epoch": 9.268867924528301, "percentage": 46.34, "elapsed_time": "0:29:25", "remaining_time": "0:34:04", "throughput": 5806.64, "total_tokens": 10251632} {"current_steps": 15725, "total_steps": 33920, "loss": 0.385, "lr": 6.4858525044770546e-06, "epoch": 9.27181603773585, "percentage": 46.36, "elapsed_time": "0:29:25", "remaining_time": "0:34:03", "throughput": 5806.55, "total_tokens": 10254224} {"current_steps": 15730, "total_steps": 33920, "loss": 0.3786, "lr": 6.483395817607497e-06, "epoch": 9.274764150943396, "percentage": 46.37, "elapsed_time": "0:29:26", "remaining_time": "0:34:02", "throughput": 5806.5, "total_tokens": 10256976} {"current_steps": 15735, "total_steps": 33920, "loss": 0.3651, "lr": 6.480938738002504e-06, "epoch": 9.277712264150944, "percentage": 46.39, "elapsed_time": "0:29:27", "remaining_time": "0:34:02", "throughput": 5806.57, "total_tokens": 10260368} {"current_steps": 15740, "total_steps": 33920, "loss": 0.37, "lr": 6.478481266312597e-06, "epoch": 9.28066037735849, "percentage": 46.4, "elapsed_time": "0:29:27", "remaining_time": "0:34:01", "throughput": 5806.67, "total_tokens": 10263920} {"current_steps": 15745, "total_steps": 33920, "loss": 0.357, "lr": 6.476023403188403e-06, "epoch": 9.283608490566039, "percentage": 46.42, "elapsed_time": "0:29:28", "remaining_time": "0:34:01", "throughput": 5806.93, "total_tokens": 10268048} {"current_steps": 15750, "total_steps": 33920, "loss": 0.4381, "lr": 6.473565149280651e-06, "epoch": 9.286556603773585, "percentage": 46.43, "elapsed_time": "0:29:28", "remaining_time": "0:34:00", "throughput": 5807.01, "total_tokens": 10271280} {"current_steps": 15755, "total_steps": 33920, "loss": 0.4675, "lr": 6.471106505240175e-06, "epoch": 9.289504716981131, "percentage": 46.45, "elapsed_time": "0:29:29", "remaining_time": "0:33:59", "throughput": 5807.03, "total_tokens": 10274256} {"current_steps": 15760, "total_steps": 33920, "loss": 0.384, "lr": 6.468647471717914e-06, "epoch": 9.29245283018868, "percentage": 46.46, "elapsed_time": "0:29:29", "remaining_time": "0:33:59", "throughput": 5806.87, "total_tokens": 10276784} {"current_steps": 15765, "total_steps": 33920, "loss": 0.4048, "lr": 6.466188049364902e-06, "epoch": 9.295400943396226, "percentage": 46.48, "elapsed_time": "0:29:30", "remaining_time": "0:33:58", "throughput": 5806.39, "total_tokens": 10279024} {"current_steps": 15770, "total_steps": 33920, "loss": 0.4125, "lr": 6.463728238832288e-06, "epoch": 9.298349056603774, "percentage": 46.49, "elapsed_time": "0:29:30", "remaining_time": "0:33:58", "throughput": 5806.43, "total_tokens": 10282352} {"current_steps": 15775, "total_steps": 33920, "loss": 0.31, "lr": 6.461268040771311e-06, "epoch": 9.30129716981132, "percentage": 46.51, "elapsed_time": "0:29:31", "remaining_time": "0:33:57", "throughput": 5806.31, "total_tokens": 10285104} {"current_steps": 15780, "total_steps": 33920, "loss": 0.4125, "lr": 6.458807455833326e-06, "epoch": 9.304245283018869, "percentage": 46.52, "elapsed_time": "0:29:31", "remaining_time": "0:33:56", "throughput": 5806.15, "total_tokens": 10287824} {"current_steps": 15785, "total_steps": 33920, "loss": 0.4139, "lr": 6.456346484669778e-06, "epoch": 9.307193396226415, "percentage": 46.54, "elapsed_time": "0:29:32", "remaining_time": "0:33:56", "throughput": 5806.4, "total_tokens": 10292016} {"current_steps": 15790, "total_steps": 33920, "loss": 0.3732, "lr": 6.4538851279322225e-06, "epoch": 9.310141509433961, "percentage": 46.55, "elapsed_time": "0:29:33", "remaining_time": "0:33:55", "throughput": 5806.59, "total_tokens": 10295568} {"current_steps": 15795, "total_steps": 33920, "loss": 0.3142, "lr": 6.451423386272312e-06, "epoch": 9.31308962264151, "percentage": 46.57, "elapsed_time": "0:29:34", "remaining_time": "0:33:55", "throughput": 5806.98, "total_tokens": 10302928} {"current_steps": 15800, "total_steps": 33920, "loss": 0.4111, "lr": 6.448961260341806e-06, "epoch": 9.316037735849056, "percentage": 46.58, "elapsed_time": "0:29:34", "remaining_time": "0:33:55", "throughput": 5807.15, "total_tokens": 10306544} {"current_steps": 15805, "total_steps": 33920, "loss": 0.3325, "lr": 6.446498750792563e-06, "epoch": 9.318985849056604, "percentage": 46.59, "elapsed_time": "0:29:35", "remaining_time": "0:33:54", "throughput": 5807.16, "total_tokens": 10309424} {"current_steps": 15810, "total_steps": 33920, "loss": 0.3642, "lr": 6.444035858276538e-06, "epoch": 9.32193396226415, "percentage": 46.61, "elapsed_time": "0:29:35", "remaining_time": "0:33:54", "throughput": 5807.21, "total_tokens": 10312496} {"current_steps": 15815, "total_steps": 33920, "loss": 0.3718, "lr": 6.441572583445799e-06, "epoch": 9.324882075471699, "percentage": 46.62, "elapsed_time": "0:29:36", "remaining_time": "0:33:53", "throughput": 5807.13, "total_tokens": 10315376} {"current_steps": 15820, "total_steps": 33920, "loss": 0.3244, "lr": 6.439108926952504e-06, "epoch": 9.327830188679245, "percentage": 46.64, "elapsed_time": "0:29:36", "remaining_time": "0:33:52", "throughput": 5807.16, "total_tokens": 10318544} {"current_steps": 15825, "total_steps": 33920, "loss": 0.4835, "lr": 6.43664488944892e-06, "epoch": 9.330778301886792, "percentage": 46.65, "elapsed_time": "0:29:37", "remaining_time": "0:33:52", "throughput": 5807.29, "total_tokens": 10321904} {"current_steps": 15830, "total_steps": 33920, "loss": 0.3416, "lr": 6.434180471587409e-06, "epoch": 9.33372641509434, "percentage": 46.67, "elapsed_time": "0:29:37", "remaining_time": "0:33:51", "throughput": 5807.45, "total_tokens": 10325392} {"current_steps": 15835, "total_steps": 33920, "loss": 0.3338, "lr": 6.431715674020438e-06, "epoch": 9.336674528301886, "percentage": 46.68, "elapsed_time": "0:29:38", "remaining_time": "0:33:51", "throughput": 5807.47, "total_tokens": 10328304} {"current_steps": 15840, "total_steps": 33920, "loss": 0.4561, "lr": 6.429250497400571e-06, "epoch": 9.339622641509434, "percentage": 46.7, "elapsed_time": "0:29:39", "remaining_time": "0:33:50", "throughput": 5808.14, "total_tokens": 10334224} {"current_steps": 15845, "total_steps": 33920, "loss": 0.501, "lr": 6.426784942380475e-06, "epoch": 9.34257075471698, "percentage": 46.71, "elapsed_time": "0:29:39", "remaining_time": "0:33:50", "throughput": 5808.23, "total_tokens": 10337200} {"current_steps": 15850, "total_steps": 33920, "loss": 0.3969, "lr": 6.424319009612917e-06, "epoch": 9.345518867924529, "percentage": 46.73, "elapsed_time": "0:29:40", "remaining_time": "0:33:49", "throughput": 5808.33, "total_tokens": 10340560} {"current_steps": 15855, "total_steps": 33920, "loss": 0.3936, "lr": 6.421852699750763e-06, "epoch": 9.348466981132075, "percentage": 46.74, "elapsed_time": "0:29:40", "remaining_time": "0:33:49", "throughput": 5808.47, "total_tokens": 10343856} {"current_steps": 15860, "total_steps": 33920, "loss": 0.3257, "lr": 6.4193860134469775e-06, "epoch": 9.351415094339623, "percentage": 46.76, "elapsed_time": "0:29:41", "remaining_time": "0:33:48", "throughput": 5808.21, "total_tokens": 10346224} {"current_steps": 15865, "total_steps": 33920, "loss": 0.3133, "lr": 6.416918951354629e-06, "epoch": 9.35436320754717, "percentage": 46.77, "elapsed_time": "0:29:41", "remaining_time": "0:33:47", "throughput": 5808.21, "total_tokens": 10349296} {"current_steps": 15870, "total_steps": 33920, "loss": 0.2675, "lr": 6.4144515141268816e-06, "epoch": 9.357311320754716, "percentage": 46.79, "elapsed_time": "0:29:42", "remaining_time": "0:33:47", "throughput": 5808.18, "total_tokens": 10352176} {"current_steps": 15875, "total_steps": 33920, "loss": 0.3042, "lr": 6.411983702416999e-06, "epoch": 9.360259433962264, "percentage": 46.8, "elapsed_time": "0:29:42", "remaining_time": "0:33:46", "throughput": 5808.16, "total_tokens": 10355472} {"current_steps": 15880, "total_steps": 33920, "loss": 0.3803, "lr": 6.409515516878346e-06, "epoch": 9.36320754716981, "percentage": 46.82, "elapsed_time": "0:29:43", "remaining_time": "0:33:46", "throughput": 5808.14, "total_tokens": 10358608} {"current_steps": 15885, "total_steps": 33920, "loss": 0.4691, "lr": 6.407046958164387e-06, "epoch": 9.366155660377359, "percentage": 46.83, "elapsed_time": "0:29:43", "remaining_time": "0:33:45", "throughput": 5808.31, "total_tokens": 10362000} {"current_steps": 15890, "total_steps": 33920, "loss": 0.4357, "lr": 6.404578026928679e-06, "epoch": 9.369103773584905, "percentage": 46.85, "elapsed_time": "0:29:44", "remaining_time": "0:33:44", "throughput": 5808.29, "total_tokens": 10364784} {"current_steps": 15895, "total_steps": 33920, "loss": 0.4585, "lr": 6.402108723824887e-06, "epoch": 9.372051886792454, "percentage": 46.86, "elapsed_time": "0:29:45", "remaining_time": "0:33:44", "throughput": 5808.19, "total_tokens": 10367760} {"current_steps": 15900, "total_steps": 33920, "loss": 0.3507, "lr": 6.399639049506767e-06, "epoch": 9.375, "percentage": 46.88, "elapsed_time": "0:29:45", "remaining_time": "0:33:44", "throughput": 5808.76, "total_tokens": 10374096} {"current_steps": 15905, "total_steps": 33920, "loss": 0.4052, "lr": 6.397169004628177e-06, "epoch": 9.377948113207546, "percentage": 46.89, "elapsed_time": "0:29:46", "remaining_time": "0:33:43", "throughput": 5808.79, "total_tokens": 10377168} {"current_steps": 15910, "total_steps": 33920, "loss": 0.5029, "lr": 6.39469858984307e-06, "epoch": 9.380896226415095, "percentage": 46.9, "elapsed_time": "0:29:46", "remaining_time": "0:33:42", "throughput": 5808.93, "total_tokens": 10380400} {"current_steps": 15915, "total_steps": 33920, "loss": 0.3237, "lr": 6.3922278058055024e-06, "epoch": 9.383844339622641, "percentage": 46.92, "elapsed_time": "0:29:47", "remaining_time": "0:33:42", "throughput": 5808.94, "total_tokens": 10383248} {"current_steps": 15920, "total_steps": 33920, "loss": 0.3945, "lr": 6.389756653169622e-06, "epoch": 9.38679245283019, "percentage": 46.93, "elapsed_time": "0:29:47", "remaining_time": "0:33:41", "throughput": 5808.98, "total_tokens": 10386320} {"current_steps": 15925, "total_steps": 33920, "loss": 0.3749, "lr": 6.387285132589678e-06, "epoch": 9.389740566037736, "percentage": 46.95, "elapsed_time": "0:29:48", "remaining_time": "0:33:40", "throughput": 5809.07, "total_tokens": 10389424} {"current_steps": 15930, "total_steps": 33920, "loss": 0.3635, "lr": 6.3848132447200166e-06, "epoch": 9.392688679245284, "percentage": 46.96, "elapsed_time": "0:29:49", "remaining_time": "0:33:40", "throughput": 5809.28, "total_tokens": 10393072} {"current_steps": 15935, "total_steps": 33920, "loss": 0.3938, "lr": 6.38234099021508e-06, "epoch": 9.39563679245283, "percentage": 46.98, "elapsed_time": "0:29:49", "remaining_time": "0:33:39", "throughput": 5809.43, "total_tokens": 10396304} {"current_steps": 15940, "total_steps": 33920, "loss": 0.333, "lr": 6.379868369729409e-06, "epoch": 9.398584905660377, "percentage": 46.99, "elapsed_time": "0:29:50", "remaining_time": "0:33:39", "throughput": 5809.58, "total_tokens": 10399664} {"current_steps": 15945, "total_steps": 33920, "loss": 0.4399, "lr": 6.377395383917642e-06, "epoch": 9.401533018867925, "percentage": 47.01, "elapsed_time": "0:29:50", "remaining_time": "0:33:38", "throughput": 5809.66, "total_tokens": 10402896} {"current_steps": 15950, "total_steps": 33920, "loss": 0.3293, "lr": 6.374922033434507e-06, "epoch": 9.404481132075471, "percentage": 47.02, "elapsed_time": "0:29:51", "remaining_time": "0:33:37", "throughput": 5809.42, "total_tokens": 10405296} {"current_steps": 15955, "total_steps": 33920, "loss": 0.4693, "lr": 6.372448318934842e-06, "epoch": 9.40742924528302, "percentage": 47.04, "elapsed_time": "0:29:51", "remaining_time": "0:33:37", "throughput": 5809.58, "total_tokens": 10408496} {"current_steps": 15960, "total_steps": 33920, "loss": 0.3165, "lr": 6.369974241073569e-06, "epoch": 9.410377358490566, "percentage": 47.05, "elapsed_time": "0:29:52", "remaining_time": "0:33:36", "throughput": 5809.74, "total_tokens": 10411888} {"current_steps": 15965, "total_steps": 33920, "loss": 0.36, "lr": 6.367499800505709e-06, "epoch": 9.413325471698114, "percentage": 47.07, "elapsed_time": "0:29:52", "remaining_time": "0:33:36", "throughput": 5809.83, "total_tokens": 10415216} {"current_steps": 15970, "total_steps": 33920, "loss": 0.3442, "lr": 6.365024997886384e-06, "epoch": 9.41627358490566, "percentage": 47.08, "elapsed_time": "0:29:53", "remaining_time": "0:33:35", "throughput": 5809.88, "total_tokens": 10418288} {"current_steps": 15975, "total_steps": 33920, "loss": 0.3624, "lr": 6.362549833870808e-06, "epoch": 9.419221698113208, "percentage": 47.1, "elapsed_time": "0:29:53", "remaining_time": "0:33:34", "throughput": 5809.79, "total_tokens": 10420912} {"current_steps": 15980, "total_steps": 33920, "loss": 0.3843, "lr": 6.360074309114293e-06, "epoch": 9.422169811320755, "percentage": 47.11, "elapsed_time": "0:29:54", "remaining_time": "0:33:34", "throughput": 5809.7, "total_tokens": 10423408} {"current_steps": 15985, "total_steps": 33920, "loss": 0.3235, "lr": 6.357598424272241e-06, "epoch": 9.425117924528301, "percentage": 47.13, "elapsed_time": "0:29:54", "remaining_time": "0:33:33", "throughput": 5810.1, "total_tokens": 10427792} {"current_steps": 15990, "total_steps": 33920, "loss": 0.4691, "lr": 6.355122180000156e-06, "epoch": 9.42806603773585, "percentage": 47.14, "elapsed_time": "0:29:55", "remaining_time": "0:33:33", "throughput": 5810.07, "total_tokens": 10430928} {"current_steps": 15995, "total_steps": 33920, "loss": 0.4132, "lr": 6.352645576953635e-06, "epoch": 9.431014150943396, "percentage": 47.16, "elapsed_time": "0:29:55", "remaining_time": "0:33:32", "throughput": 5810.25, "total_tokens": 10434704} {"current_steps": 16000, "total_steps": 33920, "loss": 0.3727, "lr": 6.350168615788366e-06, "epoch": 9.433962264150944, "percentage": 47.17, "elapsed_time": "0:29:56", "remaining_time": "0:33:32", "throughput": 5810.44, "total_tokens": 10438096} {"current_steps": 16005, "total_steps": 33920, "loss": 0.3399, "lr": 6.347691297160137e-06, "epoch": 9.43691037735849, "percentage": 47.18, "elapsed_time": "0:29:57", "remaining_time": "0:33:31", "throughput": 5810.65, "total_tokens": 10441936} {"current_steps": 16010, "total_steps": 33920, "loss": 0.3689, "lr": 6.34521362172483e-06, "epoch": 9.439858490566039, "percentage": 47.2, "elapsed_time": "0:29:57", "remaining_time": "0:33:31", "throughput": 5810.53, "total_tokens": 10445552} {"current_steps": 16015, "total_steps": 33920, "loss": 0.3888, "lr": 6.342735590138417e-06, "epoch": 9.442806603773585, "percentage": 47.21, "elapsed_time": "0:29:58", "remaining_time": "0:33:30", "throughput": 5810.59, "total_tokens": 10448848} {"current_steps": 16020, "total_steps": 33920, "loss": 0.4097, "lr": 6.340257203056972e-06, "epoch": 9.445754716981131, "percentage": 47.23, "elapsed_time": "0:29:58", "remaining_time": "0:33:29", "throughput": 5810.61, "total_tokens": 10452592} {"current_steps": 16025, "total_steps": 33920, "loss": 0.439, "lr": 6.3377784611366554e-06, "epoch": 9.44870283018868, "percentage": 47.24, "elapsed_time": "0:29:59", "remaining_time": "0:33:29", "throughput": 5810.79, "total_tokens": 10456272} {"current_steps": 16030, "total_steps": 33920, "loss": 0.4599, "lr": 6.335299365033726e-06, "epoch": 9.451650943396226, "percentage": 47.26, "elapsed_time": "0:30:00", "remaining_time": "0:33:28", "throughput": 5811.09, "total_tokens": 10460080} {"current_steps": 16035, "total_steps": 33920, "loss": 0.3853, "lr": 6.3328199154045346e-06, "epoch": 9.454599056603774, "percentage": 47.27, "elapsed_time": "0:30:00", "remaining_time": "0:33:28", "throughput": 5811.17, "total_tokens": 10463248} {"current_steps": 16040, "total_steps": 33920, "loss": 0.4637, "lr": 6.3303401129055265e-06, "epoch": 9.45754716981132, "percentage": 47.29, "elapsed_time": "0:30:01", "remaining_time": "0:33:27", "throughput": 5811.3, "total_tokens": 10466896} {"current_steps": 16045, "total_steps": 33920, "loss": 0.3629, "lr": 6.32785995819324e-06, "epoch": 9.460495283018869, "percentage": 47.3, "elapsed_time": "0:30:01", "remaining_time": "0:33:27", "throughput": 5811.46, "total_tokens": 10470128} {"current_steps": 16050, "total_steps": 33920, "loss": 0.4269, "lr": 6.3253794519243075e-06, "epoch": 9.463443396226415, "percentage": 47.32, "elapsed_time": "0:30:02", "remaining_time": "0:33:26", "throughput": 5811.55, "total_tokens": 10473840} {"current_steps": 16055, "total_steps": 33920, "loss": 0.3994, "lr": 6.322898594755452e-06, "epoch": 9.466391509433961, "percentage": 47.33, "elapsed_time": "0:30:02", "remaining_time": "0:33:26", "throughput": 5811.72, "total_tokens": 10477424} {"current_steps": 16060, "total_steps": 33920, "loss": 0.3488, "lr": 6.320417387343492e-06, "epoch": 9.46933962264151, "percentage": 47.35, "elapsed_time": "0:30:03", "remaining_time": "0:33:25", "throughput": 5811.76, "total_tokens": 10480688} {"current_steps": 16065, "total_steps": 33920, "loss": 0.357, "lr": 6.3179358303453386e-06, "epoch": 9.472287735849056, "percentage": 47.36, "elapsed_time": "0:30:03", "remaining_time": "0:33:24", "throughput": 5812.02, "total_tokens": 10484720} {"current_steps": 16070, "total_steps": 33920, "loss": 0.3579, "lr": 6.315453924417995e-06, "epoch": 9.475235849056604, "percentage": 47.38, "elapsed_time": "0:30:04", "remaining_time": "0:33:24", "throughput": 5812.16, "total_tokens": 10487952} {"current_steps": 16075, "total_steps": 33920, "loss": 0.3065, "lr": 6.312971670218554e-06, "epoch": 9.47818396226415, "percentage": 47.39, "elapsed_time": "0:30:05", "remaining_time": "0:33:23", "throughput": 5812.37, "total_tokens": 10491664} {"current_steps": 16080, "total_steps": 33920, "loss": 0.4577, "lr": 6.3104890684042055e-06, "epoch": 9.481132075471699, "percentage": 47.41, "elapsed_time": "0:30:05", "remaining_time": "0:33:23", "throughput": 5812.39, "total_tokens": 10494416} {"current_steps": 16085, "total_steps": 33920, "loss": 0.3334, "lr": 6.308006119632228e-06, "epoch": 9.484080188679245, "percentage": 47.42, "elapsed_time": "0:30:05", "remaining_time": "0:33:22", "throughput": 5812.2, "total_tokens": 10496816} {"current_steps": 16090, "total_steps": 33920, "loss": 0.3879, "lr": 6.305522824559993e-06, "epoch": 9.487028301886792, "percentage": 47.44, "elapsed_time": "0:30:06", "remaining_time": "0:33:21", "throughput": 5812.34, "total_tokens": 10500304} {"current_steps": 16095, "total_steps": 33920, "loss": 0.4932, "lr": 6.303039183844965e-06, "epoch": 9.48997641509434, "percentage": 47.45, "elapsed_time": "0:30:07", "remaining_time": "0:33:21", "throughput": 5812.25, "total_tokens": 10502992} {"current_steps": 16100, "total_steps": 33920, "loss": 0.4101, "lr": 6.300555198144697e-06, "epoch": 9.492924528301886, "percentage": 47.46, "elapsed_time": "0:30:07", "remaining_time": "0:33:20", "throughput": 5811.99, "total_tokens": 10505200} {"current_steps": 16105, "total_steps": 33920, "loss": 0.4393, "lr": 6.2980708681168335e-06, "epoch": 9.495872641509434, "percentage": 47.48, "elapsed_time": "0:30:08", "remaining_time": "0:33:19", "throughput": 5812.03, "total_tokens": 10508176} {"current_steps": 16110, "total_steps": 33920, "loss": 0.3644, "lr": 6.2955861944191145e-06, "epoch": 9.49882075471698, "percentage": 47.49, "elapsed_time": "0:30:08", "remaining_time": "0:33:19", "throughput": 5811.97, "total_tokens": 10510928} {"current_steps": 16115, "total_steps": 33920, "loss": 0.4075, "lr": 6.293101177709367e-06, "epoch": 9.501768867924529, "percentage": 47.51, "elapsed_time": "0:30:09", "remaining_time": "0:33:18", "throughput": 5812.05, "total_tokens": 10514000} {"current_steps": 16120, "total_steps": 33920, "loss": 0.3591, "lr": 6.290615818645509e-06, "epoch": 9.504716981132075, "percentage": 47.52, "elapsed_time": "0:30:09", "remaining_time": "0:33:18", "throughput": 5812.13, "total_tokens": 10517392} {"current_steps": 16125, "total_steps": 33920, "loss": 0.4013, "lr": 6.288130117885552e-06, "epoch": 9.507665094339622, "percentage": 47.54, "elapsed_time": "0:30:10", "remaining_time": "0:33:17", "throughput": 5812.31, "total_tokens": 10520688} {"current_steps": 16130, "total_steps": 33920, "loss": 0.3585, "lr": 6.285644076087594e-06, "epoch": 9.51061320754717, "percentage": 47.55, "elapsed_time": "0:30:10", "remaining_time": "0:33:16", "throughput": 5812.26, "total_tokens": 10523280} {"current_steps": 16135, "total_steps": 33920, "loss": 0.3922, "lr": 6.283157693909826e-06, "epoch": 9.513561320754716, "percentage": 47.57, "elapsed_time": "0:30:11", "remaining_time": "0:33:16", "throughput": 5812.47, "total_tokens": 10526928} {"current_steps": 16140, "total_steps": 33920, "loss": 0.2761, "lr": 6.280670972010528e-06, "epoch": 9.516509433962264, "percentage": 47.58, "elapsed_time": "0:30:11", "remaining_time": "0:33:15", "throughput": 5812.6, "total_tokens": 10529968} {"current_steps": 16145, "total_steps": 33920, "loss": 0.3571, "lr": 6.278183911048072e-06, "epoch": 9.51945754716981, "percentage": 47.6, "elapsed_time": "0:30:12", "remaining_time": "0:33:15", "throughput": 5812.69, "total_tokens": 10533200} {"current_steps": 16150, "total_steps": 33920, "loss": 0.3913, "lr": 6.275696511680915e-06, "epoch": 9.522405660377359, "percentage": 47.61, "elapsed_time": "0:30:12", "remaining_time": "0:33:14", "throughput": 5812.75, "total_tokens": 10536048} {"current_steps": 16155, "total_steps": 33920, "loss": 0.506, "lr": 6.27320877456761e-06, "epoch": 9.525353773584905, "percentage": 47.63, "elapsed_time": "0:30:13", "remaining_time": "0:33:13", "throughput": 5813.02, "total_tokens": 10539760} {"current_steps": 16160, "total_steps": 33920, "loss": 0.6174, "lr": 6.270720700366793e-06, "epoch": 9.528301886792454, "percentage": 47.64, "elapsed_time": "0:30:13", "remaining_time": "0:33:13", "throughput": 5813.36, "total_tokens": 10544016} {"current_steps": 16165, "total_steps": 33920, "loss": 0.4251, "lr": 6.2682322897371974e-06, "epoch": 9.53125, "percentage": 47.66, "elapsed_time": "0:30:14", "remaining_time": "0:33:12", "throughput": 5813.7, "total_tokens": 10547984} {"current_steps": 16170, "total_steps": 33920, "loss": 0.3509, "lr": 6.265743543337634e-06, "epoch": 9.534198113207546, "percentage": 47.67, "elapsed_time": "0:30:14", "remaining_time": "0:33:12", "throughput": 5813.87, "total_tokens": 10551568} {"current_steps": 16175, "total_steps": 33920, "loss": 0.2753, "lr": 6.2632544618270156e-06, "epoch": 9.537146226415095, "percentage": 47.69, "elapsed_time": "0:30:15", "remaining_time": "0:33:11", "throughput": 5814.01, "total_tokens": 10554608} {"current_steps": 16180, "total_steps": 33920, "loss": 0.4476, "lr": 6.260765045864332e-06, "epoch": 9.540094339622641, "percentage": 47.7, "elapsed_time": "0:30:15", "remaining_time": "0:33:10", "throughput": 5814.24, "total_tokens": 10558160} {"current_steps": 16185, "total_steps": 33920, "loss": 0.4223, "lr": 6.258275296108669e-06, "epoch": 9.54304245283019, "percentage": 47.72, "elapsed_time": "0:30:16", "remaining_time": "0:33:10", "throughput": 5814.21, "total_tokens": 10560720} {"current_steps": 16190, "total_steps": 33920, "loss": 0.4747, "lr": 6.2557852132191985e-06, "epoch": 9.545990566037736, "percentage": 47.73, "elapsed_time": "0:30:16", "remaining_time": "0:33:09", "throughput": 5814.53, "total_tokens": 10564752} {"current_steps": 16195, "total_steps": 33920, "loss": 0.3604, "lr": 6.253294797855182e-06, "epoch": 9.548938679245284, "percentage": 47.74, "elapsed_time": "0:30:17", "remaining_time": "0:33:09", "throughput": 5814.5, "total_tokens": 10567600} {"current_steps": 16200, "total_steps": 33920, "loss": 0.4247, "lr": 6.250804050675964e-06, "epoch": 9.55188679245283, "percentage": 47.76, "elapsed_time": "0:30:18", "remaining_time": "0:33:08", "throughput": 5814.68, "total_tokens": 10571280} {"current_steps": 16205, "total_steps": 33920, "loss": 0.4556, "lr": 6.248312972340984e-06, "epoch": 9.554834905660378, "percentage": 47.77, "elapsed_time": "0:30:18", "remaining_time": "0:33:08", "throughput": 5814.93, "total_tokens": 10574928} {"current_steps": 16210, "total_steps": 33920, "loss": 0.5248, "lr": 6.2458215635097656e-06, "epoch": 9.557783018867925, "percentage": 47.79, "elapsed_time": "0:30:19", "remaining_time": "0:33:07", "throughput": 5815.19, "total_tokens": 10578864} {"current_steps": 16215, "total_steps": 33920, "loss": 0.3577, "lr": 6.2433298248419175e-06, "epoch": 9.560731132075471, "percentage": 47.8, "elapsed_time": "0:30:19", "remaining_time": "0:33:06", "throughput": 5815.2, "total_tokens": 10581648} {"current_steps": 16220, "total_steps": 33920, "loss": 0.3685, "lr": 6.2408377569971405e-06, "epoch": 9.56367924528302, "percentage": 47.82, "elapsed_time": "0:30:20", "remaining_time": "0:33:06", "throughput": 5815.35, "total_tokens": 10585424} {"current_steps": 16225, "total_steps": 33920, "loss": 0.4587, "lr": 6.238345360635221e-06, "epoch": 9.566627358490566, "percentage": 47.83, "elapsed_time": "0:30:20", "remaining_time": "0:33:05", "throughput": 5815.16, "total_tokens": 10587856} {"current_steps": 16230, "total_steps": 33920, "loss": 0.4316, "lr": 6.2358526364160274e-06, "epoch": 9.569575471698114, "percentage": 47.85, "elapsed_time": "0:30:21", "remaining_time": "0:33:05", "throughput": 5815.26, "total_tokens": 10591536} {"current_steps": 16235, "total_steps": 33920, "loss": 0.338, "lr": 6.2333595849995245e-06, "epoch": 9.57252358490566, "percentage": 47.86, "elapsed_time": "0:30:21", "remaining_time": "0:33:04", "throughput": 5815.43, "total_tokens": 10594768} {"current_steps": 16240, "total_steps": 33920, "loss": 0.3746, "lr": 6.230866207045756e-06, "epoch": 9.575471698113208, "percentage": 47.88, "elapsed_time": "0:30:22", "remaining_time": "0:33:03", "throughput": 5815.69, "total_tokens": 10598384} {"current_steps": 16245, "total_steps": 33920, "loss": 0.2456, "lr": 6.228372503214853e-06, "epoch": 9.578419811320755, "percentage": 47.89, "elapsed_time": "0:30:22", "remaining_time": "0:33:03", "throughput": 5815.86, "total_tokens": 10601776} {"current_steps": 16250, "total_steps": 33920, "loss": 0.6167, "lr": 6.225878474167035e-06, "epoch": 9.581367924528301, "percentage": 47.91, "elapsed_time": "0:30:23", "remaining_time": "0:33:03", "throughput": 5816.22, "total_tokens": 10607760} {"current_steps": 16255, "total_steps": 33920, "loss": 0.6155, "lr": 6.22338412056261e-06, "epoch": 9.58431603773585, "percentage": 47.92, "elapsed_time": "0:30:24", "remaining_time": "0:33:02", "throughput": 5816.27, "total_tokens": 10610832} {"current_steps": 16260, "total_steps": 33920, "loss": 0.3425, "lr": 6.220889443061966e-06, "epoch": 9.587264150943396, "percentage": 47.94, "elapsed_time": "0:30:24", "remaining_time": "0:33:01", "throughput": 5816.45, "total_tokens": 10614192} {"current_steps": 16265, "total_steps": 33920, "loss": 0.4821, "lr": 6.2183944423255796e-06, "epoch": 9.590212264150944, "percentage": 47.95, "elapsed_time": "0:30:25", "remaining_time": "0:33:01", "throughput": 5816.39, "total_tokens": 10616848} {"current_steps": 16270, "total_steps": 33920, "loss": 0.3529, "lr": 6.215899119014015e-06, "epoch": 9.59316037735849, "percentage": 47.97, "elapsed_time": "0:30:25", "remaining_time": "0:33:00", "throughput": 5816.45, "total_tokens": 10620144} {"current_steps": 16275, "total_steps": 33920, "loss": 0.3387, "lr": 6.2134034737879175e-06, "epoch": 9.596108490566039, "percentage": 47.98, "elapsed_time": "0:30:26", "remaining_time": "0:33:00", "throughput": 5816.4, "total_tokens": 10622832} {"current_steps": 16280, "total_steps": 33920, "loss": 0.4255, "lr": 6.2109075073080205e-06, "epoch": 9.599056603773585, "percentage": 48.0, "elapsed_time": "0:30:26", "remaining_time": "0:32:59", "throughput": 5816.39, "total_tokens": 10625552} {"current_steps": 16285, "total_steps": 33920, "loss": 0.3471, "lr": 6.2084112202351425e-06, "epoch": 9.602004716981131, "percentage": 48.01, "elapsed_time": "0:30:27", "remaining_time": "0:32:58", "throughput": 5816.42, "total_tokens": 10628368} {"current_steps": 16290, "total_steps": 33920, "loss": 0.3244, "lr": 6.205914613230186e-06, "epoch": 9.60495283018868, "percentage": 48.02, "elapsed_time": "0:30:27", "remaining_time": "0:32:58", "throughput": 5816.51, "total_tokens": 10631920} {"current_steps": 16295, "total_steps": 33920, "loss": 0.3593, "lr": 6.203417686954138e-06, "epoch": 9.607900943396226, "percentage": 48.04, "elapsed_time": "0:30:28", "remaining_time": "0:32:57", "throughput": 5816.59, "total_tokens": 10635152} {"current_steps": 16300, "total_steps": 33920, "loss": 0.3664, "lr": 6.2009204420680706e-06, "epoch": 9.610849056603774, "percentage": 48.05, "elapsed_time": "0:30:28", "remaining_time": "0:32:57", "throughput": 5816.59, "total_tokens": 10638096} {"current_steps": 16305, "total_steps": 33920, "loss": 0.4008, "lr": 6.198422879233141e-06, "epoch": 9.61379716981132, "percentage": 48.07, "elapsed_time": "0:30:29", "remaining_time": "0:32:56", "throughput": 5816.65, "total_tokens": 10641136} {"current_steps": 16310, "total_steps": 33920, "loss": 0.4521, "lr": 6.1959249991105895e-06, "epoch": 9.616745283018869, "percentage": 48.08, "elapsed_time": "0:30:29", "remaining_time": "0:32:55", "throughput": 5816.71, "total_tokens": 10644176} {"current_steps": 16315, "total_steps": 33920, "loss": 0.3356, "lr": 6.19342680236174e-06, "epoch": 9.619693396226415, "percentage": 48.1, "elapsed_time": "0:30:30", "remaining_time": "0:32:55", "throughput": 5816.45, "total_tokens": 10646608} {"current_steps": 16320, "total_steps": 33920, "loss": 0.4796, "lr": 6.190928289648003e-06, "epoch": 9.622641509433961, "percentage": 48.11, "elapsed_time": "0:30:31", "remaining_time": "0:32:54", "throughput": 5816.75, "total_tokens": 10650672} {"current_steps": 16325, "total_steps": 33920, "loss": 0.3043, "lr": 6.188429461630866e-06, "epoch": 9.62558962264151, "percentage": 48.13, "elapsed_time": "0:30:31", "remaining_time": "0:32:54", "throughput": 5816.75, "total_tokens": 10653680} {"current_steps": 16330, "total_steps": 33920, "loss": 0.3331, "lr": 6.185930318971909e-06, "epoch": 9.628537735849056, "percentage": 48.14, "elapsed_time": "0:30:32", "remaining_time": "0:32:53", "throughput": 5816.83, "total_tokens": 10656976} {"current_steps": 16335, "total_steps": 33920, "loss": 0.441, "lr": 6.1834308623327885e-06, "epoch": 9.631485849056604, "percentage": 48.16, "elapsed_time": "0:30:32", "remaining_time": "0:32:52", "throughput": 5816.81, "total_tokens": 10659664} {"current_steps": 16340, "total_steps": 33920, "loss": 0.3928, "lr": 6.180931092375247e-06, "epoch": 9.63443396226415, "percentage": 48.17, "elapsed_time": "0:30:33", "remaining_time": "0:32:52", "throughput": 5817.06, "total_tokens": 10663792} {"current_steps": 16345, "total_steps": 33920, "loss": 0.3496, "lr": 6.1784310097611075e-06, "epoch": 9.637382075471699, "percentage": 48.19, "elapsed_time": "0:30:33", "remaining_time": "0:32:51", "throughput": 5816.91, "total_tokens": 10666160} {"current_steps": 16350, "total_steps": 33920, "loss": 0.345, "lr": 6.1759306151522815e-06, "epoch": 9.640330188679245, "percentage": 48.2, "elapsed_time": "0:30:34", "remaining_time": "0:32:50", "throughput": 5816.9, "total_tokens": 10668976} {"current_steps": 16355, "total_steps": 33920, "loss": 0.2711, "lr": 6.173429909210755e-06, "epoch": 9.643278301886792, "percentage": 48.22, "elapsed_time": "0:30:34", "remaining_time": "0:32:50", "throughput": 5817.14, "total_tokens": 10672784} {"current_steps": 16360, "total_steps": 33920, "loss": 0.4054, "lr": 6.170928892598606e-06, "epoch": 9.64622641509434, "percentage": 48.23, "elapsed_time": "0:30:35", "remaining_time": "0:32:49", "throughput": 5817.36, "total_tokens": 10676336} {"current_steps": 16365, "total_steps": 33920, "loss": 0.3172, "lr": 6.168427565977984e-06, "epoch": 9.649174528301886, "percentage": 48.25, "elapsed_time": "0:30:35", "remaining_time": "0:32:49", "throughput": 5817.36, "total_tokens": 10679344} {"current_steps": 16370, "total_steps": 33920, "loss": 0.3845, "lr": 6.165925930011129e-06, "epoch": 9.652122641509434, "percentage": 48.26, "elapsed_time": "0:30:36", "remaining_time": "0:32:48", "throughput": 5817.32, "total_tokens": 10682416} {"current_steps": 16375, "total_steps": 33920, "loss": 0.4313, "lr": 6.163423985360359e-06, "epoch": 9.65507075471698, "percentage": 48.28, "elapsed_time": "0:30:36", "remaining_time": "0:32:48", "throughput": 5817.48, "total_tokens": 10685616} {"current_steps": 16380, "total_steps": 33920, "loss": 0.3738, "lr": 6.160921732688076e-06, "epoch": 9.658018867924529, "percentage": 48.29, "elapsed_time": "0:30:37", "remaining_time": "0:32:47", "throughput": 5817.64, "total_tokens": 10688848} {"current_steps": 16385, "total_steps": 33920, "loss": 0.5055, "lr": 6.158419172656759e-06, "epoch": 9.660966981132075, "percentage": 48.3, "elapsed_time": "0:30:37", "remaining_time": "0:32:46", "throughput": 5817.72, "total_tokens": 10692048} {"current_steps": 16390, "total_steps": 33920, "loss": 0.4606, "lr": 6.155916305928974e-06, "epoch": 9.663915094339622, "percentage": 48.32, "elapsed_time": "0:30:38", "remaining_time": "0:32:46", "throughput": 5817.78, "total_tokens": 10695472} {"current_steps": 16395, "total_steps": 33920, "loss": 0.3599, "lr": 6.153413133167366e-06, "epoch": 9.66686320754717, "percentage": 48.33, "elapsed_time": "0:30:38", "remaining_time": "0:32:45", "throughput": 5817.88, "total_tokens": 10698768} {"current_steps": 16400, "total_steps": 33920, "loss": 0.3355, "lr": 6.1509096550346596e-06, "epoch": 9.669811320754716, "percentage": 48.35, "elapsed_time": "0:30:39", "remaining_time": "0:32:45", "throughput": 5818.09, "total_tokens": 10702288} {"current_steps": 16405, "total_steps": 33920, "loss": 0.4104, "lr": 6.148405872193661e-06, "epoch": 9.672759433962264, "percentage": 48.36, "elapsed_time": "0:30:40", "remaining_time": "0:32:44", "throughput": 5818.3, "total_tokens": 10706096} {"current_steps": 16410, "total_steps": 33920, "loss": 0.433, "lr": 6.14590178530726e-06, "epoch": 9.67570754716981, "percentage": 48.38, "elapsed_time": "0:30:40", "remaining_time": "0:32:43", "throughput": 5818.43, "total_tokens": 10709392} {"current_steps": 16415, "total_steps": 33920, "loss": 0.3584, "lr": 6.143397395038422e-06, "epoch": 9.678655660377359, "percentage": 48.39, "elapsed_time": "0:30:41", "remaining_time": "0:32:43", "throughput": 5818.68, "total_tokens": 10713360} {"current_steps": 16420, "total_steps": 33920, "loss": 0.4353, "lr": 6.140892702050196e-06, "epoch": 9.681603773584905, "percentage": 48.41, "elapsed_time": "0:30:41", "remaining_time": "0:32:42", "throughput": 5818.75, "total_tokens": 10716464} {"current_steps": 16425, "total_steps": 33920, "loss": 0.4035, "lr": 6.138387707005711e-06, "epoch": 9.684551886792454, "percentage": 48.42, "elapsed_time": "0:30:42", "remaining_time": "0:32:42", "throughput": 5818.88, "total_tokens": 10719824} {"current_steps": 16430, "total_steps": 33920, "loss": 0.4111, "lr": 6.135882410568172e-06, "epoch": 9.6875, "percentage": 48.44, "elapsed_time": "0:30:42", "remaining_time": "0:32:41", "throughput": 5818.85, "total_tokens": 10722768} {"current_steps": 16435, "total_steps": 33920, "loss": 0.4062, "lr": 6.133376813400872e-06, "epoch": 9.690448113207546, "percentage": 48.45, "elapsed_time": "0:30:43", "remaining_time": "0:32:40", "throughput": 5818.55, "total_tokens": 10724944} {"current_steps": 16440, "total_steps": 33920, "loss": 0.4833, "lr": 6.130870916167175e-06, "epoch": 9.693396226415095, "percentage": 48.47, "elapsed_time": "0:30:43", "remaining_time": "0:32:40", "throughput": 5818.59, "total_tokens": 10728048} {"current_steps": 16445, "total_steps": 33920, "loss": 0.5316, "lr": 6.128364719530528e-06, "epoch": 9.696344339622641, "percentage": 48.48, "elapsed_time": "0:30:44", "remaining_time": "0:32:39", "throughput": 5818.56, "total_tokens": 10730768} {"current_steps": 16450, "total_steps": 33920, "loss": 0.4095, "lr": 6.125858224154459e-06, "epoch": 9.69929245283019, "percentage": 48.5, "elapsed_time": "0:30:44", "remaining_time": "0:32:39", "throughput": 5818.71, "total_tokens": 10734000} {"current_steps": 16455, "total_steps": 33920, "loss": 0.3504, "lr": 6.123351430702576e-06, "epoch": 9.702240566037736, "percentage": 48.51, "elapsed_time": "0:30:45", "remaining_time": "0:32:38", "throughput": 5818.65, "total_tokens": 10736592} {"current_steps": 16460, "total_steps": 33920, "loss": 0.294, "lr": 6.1208443398385575e-06, "epoch": 9.705188679245284, "percentage": 48.53, "elapsed_time": "0:30:45", "remaining_time": "0:32:37", "throughput": 5818.78, "total_tokens": 10739888} {"current_steps": 16465, "total_steps": 33920, "loss": 0.5239, "lr": 6.118336952226169e-06, "epoch": 9.70813679245283, "percentage": 48.54, "elapsed_time": "0:30:46", "remaining_time": "0:32:37", "throughput": 5819.09, "total_tokens": 10743984} {"current_steps": 16470, "total_steps": 33920, "loss": 0.3339, "lr": 6.115829268529254e-06, "epoch": 9.711084905660378, "percentage": 48.56, "elapsed_time": "0:30:46", "remaining_time": "0:32:36", "throughput": 5819.42, "total_tokens": 10747792} {"current_steps": 16475, "total_steps": 33920, "loss": 0.3415, "lr": 6.1133212894117326e-06, "epoch": 9.714033018867925, "percentage": 48.57, "elapsed_time": "0:30:47", "remaining_time": "0:32:36", "throughput": 5819.55, "total_tokens": 10751152} {"current_steps": 16480, "total_steps": 33920, "loss": 0.4803, "lr": 6.1108130155375986e-06, "epoch": 9.716981132075471, "percentage": 48.58, "elapsed_time": "0:30:47", "remaining_time": "0:32:35", "throughput": 5819.64, "total_tokens": 10754192} {"current_steps": 16485, "total_steps": 33920, "loss": 0.3669, "lr": 6.108304447570933e-06, "epoch": 9.71992924528302, "percentage": 48.6, "elapsed_time": "0:30:48", "remaining_time": "0:32:34", "throughput": 5819.83, "total_tokens": 10757584} {"current_steps": 16490, "total_steps": 33920, "loss": 0.454, "lr": 6.105795586175888e-06, "epoch": 9.722877358490566, "percentage": 48.61, "elapsed_time": "0:30:48", "remaining_time": "0:32:34", "throughput": 5819.94, "total_tokens": 10760816} {"current_steps": 16495, "total_steps": 33920, "loss": 0.4062, "lr": 6.1032864320166954e-06, "epoch": 9.725825471698114, "percentage": 48.63, "elapsed_time": "0:30:49", "remaining_time": "0:32:33", "throughput": 5820.2, "total_tokens": 10764880} {"current_steps": 16500, "total_steps": 33920, "loss": 0.358, "lr": 6.100776985757666e-06, "epoch": 9.72877358490566, "percentage": 48.64, "elapsed_time": "0:30:50", "remaining_time": "0:32:33", "throughput": 5820.08, "total_tokens": 10767632} {"current_steps": 16505, "total_steps": 33920, "loss": 0.4597, "lr": 6.098267248063186e-06, "epoch": 9.731721698113208, "percentage": 48.66, "elapsed_time": "0:30:50", "remaining_time": "0:32:32", "throughput": 5819.99, "total_tokens": 10770288} {"current_steps": 16510, "total_steps": 33920, "loss": 0.4452, "lr": 6.0957572195977165e-06, "epoch": 9.734669811320755, "percentage": 48.67, "elapsed_time": "0:30:51", "remaining_time": "0:32:31", "throughput": 5819.99, "total_tokens": 10773296} {"current_steps": 16515, "total_steps": 33920, "loss": 0.4105, "lr": 6.0932469010258025e-06, "epoch": 9.737617924528301, "percentage": 48.69, "elapsed_time": "0:30:51", "remaining_time": "0:32:31", "throughput": 5819.93, "total_tokens": 10776048} {"current_steps": 16520, "total_steps": 33920, "loss": 0.3266, "lr": 6.0907362930120594e-06, "epoch": 9.74056603773585, "percentage": 48.7, "elapsed_time": "0:30:52", "remaining_time": "0:32:30", "throughput": 5820.22, "total_tokens": 10780080} {"current_steps": 16525, "total_steps": 33920, "loss": 0.3753, "lr": 6.088225396221181e-06, "epoch": 9.743514150943396, "percentage": 48.72, "elapsed_time": "0:30:52", "remaining_time": "0:32:30", "throughput": 5820.27, "total_tokens": 10783344} {"current_steps": 16530, "total_steps": 33920, "loss": 0.3171, "lr": 6.0857142113179415e-06, "epoch": 9.746462264150944, "percentage": 48.73, "elapsed_time": "0:30:53", "remaining_time": "0:32:29", "throughput": 5820.23, "total_tokens": 10786000} {"current_steps": 16535, "total_steps": 33920, "loss": 0.4202, "lr": 6.083202738967182e-06, "epoch": 9.74941037735849, "percentage": 48.75, "elapsed_time": "0:30:53", "remaining_time": "0:32:29", "throughput": 5820.45, "total_tokens": 10789744} {"current_steps": 16540, "total_steps": 33920, "loss": 0.3832, "lr": 6.0806909798338324e-06, "epoch": 9.752358490566039, "percentage": 48.76, "elapsed_time": "0:30:54", "remaining_time": "0:32:28", "throughput": 5820.53, "total_tokens": 10793168} {"current_steps": 16545, "total_steps": 33920, "loss": 0.3651, "lr": 6.0781789345828854e-06, "epoch": 9.755306603773585, "percentage": 48.78, "elapsed_time": "0:30:54", "remaining_time": "0:32:27", "throughput": 5820.5, "total_tokens": 10796016} {"current_steps": 16550, "total_steps": 33920, "loss": 0.4898, "lr": 6.0756666038794195e-06, "epoch": 9.758254716981131, "percentage": 48.79, "elapsed_time": "0:30:55", "remaining_time": "0:32:27", "throughput": 5820.41, "total_tokens": 10798928} {"current_steps": 16555, "total_steps": 33920, "loss": 0.3439, "lr": 6.073153988388586e-06, "epoch": 9.76120283018868, "percentage": 48.81, "elapsed_time": "0:30:55", "remaining_time": "0:32:26", "throughput": 5820.57, "total_tokens": 10802416} {"current_steps": 16560, "total_steps": 33920, "loss": 0.3928, "lr": 6.070641088775608e-06, "epoch": 9.764150943396226, "percentage": 48.82, "elapsed_time": "0:30:56", "remaining_time": "0:32:26", "throughput": 5820.53, "total_tokens": 10805104} {"current_steps": 16565, "total_steps": 33920, "loss": 0.4216, "lr": 6.068127905705787e-06, "epoch": 9.767099056603774, "percentage": 48.84, "elapsed_time": "0:30:56", "remaining_time": "0:32:25", "throughput": 5820.59, "total_tokens": 10808496} {"current_steps": 16570, "total_steps": 33920, "loss": 0.4061, "lr": 6.065614439844501e-06, "epoch": 9.77004716981132, "percentage": 48.85, "elapsed_time": "0:30:57", "remaining_time": "0:32:24", "throughput": 5820.69, "total_tokens": 10811632} {"current_steps": 16575, "total_steps": 33920, "loss": 0.4434, "lr": 6.063100691857198e-06, "epoch": 9.772995283018869, "percentage": 48.86, "elapsed_time": "0:30:57", "remaining_time": "0:32:24", "throughput": 5820.73, "total_tokens": 10814640} {"current_steps": 16580, "total_steps": 33920, "loss": 0.502, "lr": 6.060586662409407e-06, "epoch": 9.775943396226415, "percentage": 48.88, "elapsed_time": "0:30:58", "remaining_time": "0:32:23", "throughput": 5820.85, "total_tokens": 10817840} {"current_steps": 16585, "total_steps": 33920, "loss": 0.4667, "lr": 6.058072352166724e-06, "epoch": 9.778891509433961, "percentage": 48.89, "elapsed_time": "0:30:58", "remaining_time": "0:32:23", "throughput": 5820.93, "total_tokens": 10820944} {"current_steps": 16590, "total_steps": 33920, "loss": 0.3563, "lr": 6.055557761794826e-06, "epoch": 9.78183962264151, "percentage": 48.91, "elapsed_time": "0:30:59", "remaining_time": "0:32:22", "throughput": 5820.92, "total_tokens": 10823760} {"current_steps": 16595, "total_steps": 33920, "loss": 0.3519, "lr": 6.053042891959462e-06, "epoch": 9.784787735849056, "percentage": 48.92, "elapsed_time": "0:30:59", "remaining_time": "0:32:21", "throughput": 5820.83, "total_tokens": 10826224} {"current_steps": 16600, "total_steps": 33920, "loss": 0.3644, "lr": 6.050527743326455e-06, "epoch": 9.787735849056604, "percentage": 48.94, "elapsed_time": "0:31:00", "remaining_time": "0:32:21", "throughput": 5821.09, "total_tokens": 10830288} {"current_steps": 16605, "total_steps": 33920, "loss": 0.3833, "lr": 6.048012316561699e-06, "epoch": 9.79068396226415, "percentage": 48.95, "elapsed_time": "0:31:01", "remaining_time": "0:32:20", "throughput": 5821.19, "total_tokens": 10833392} {"current_steps": 16610, "total_steps": 33920, "loss": 0.377, "lr": 6.045496612331166e-06, "epoch": 9.793632075471699, "percentage": 48.97, "elapsed_time": "0:31:01", "remaining_time": "0:32:19", "throughput": 5821.36, "total_tokens": 10836688} {"current_steps": 16615, "total_steps": 33920, "loss": 0.5257, "lr": 6.0429806313009e-06, "epoch": 9.796580188679245, "percentage": 48.98, "elapsed_time": "0:31:02", "remaining_time": "0:32:19", "throughput": 5821.28, "total_tokens": 10839248} {"current_steps": 16620, "total_steps": 33920, "loss": 0.2781, "lr": 6.040464374137015e-06, "epoch": 9.799528301886792, "percentage": 49.0, "elapsed_time": "0:31:02", "remaining_time": "0:32:18", "throughput": 5821.29, "total_tokens": 10842416} {"current_steps": 16625, "total_steps": 33920, "loss": 0.3882, "lr": 6.0379478415057045e-06, "epoch": 9.80247641509434, "percentage": 49.01, "elapsed_time": "0:31:03", "remaining_time": "0:32:18", "throughput": 5821.26, "total_tokens": 10845136} {"current_steps": 16630, "total_steps": 33920, "loss": 0.2995, "lr": 6.035431034073228e-06, "epoch": 9.805424528301886, "percentage": 49.03, "elapsed_time": "0:31:03", "remaining_time": "0:32:17", "throughput": 5821.33, "total_tokens": 10848272} {"current_steps": 16635, "total_steps": 33920, "loss": 0.3818, "lr": 6.0329139525059235e-06, "epoch": 9.808372641509434, "percentage": 49.04, "elapsed_time": "0:31:04", "remaining_time": "0:32:16", "throughput": 5821.27, "total_tokens": 10850992} {"current_steps": 16640, "total_steps": 33920, "loss": 0.4443, "lr": 6.030396597470198e-06, "epoch": 9.81132075471698, "percentage": 49.06, "elapsed_time": "0:31:04", "remaining_time": "0:32:16", "throughput": 5821.2, "total_tokens": 10854096} {"current_steps": 16645, "total_steps": 33920, "loss": 0.3796, "lr": 6.027878969632534e-06, "epoch": 9.814268867924529, "percentage": 49.07, "elapsed_time": "0:31:05", "remaining_time": "0:32:15", "throughput": 5821.47, "total_tokens": 10857936} {"current_steps": 16650, "total_steps": 33920, "loss": 0.4803, "lr": 6.025361069659482e-06, "epoch": 9.817216981132075, "percentage": 49.09, "elapsed_time": "0:31:05", "remaining_time": "0:32:15", "throughput": 5821.47, "total_tokens": 10860784} {"current_steps": 16655, "total_steps": 33920, "loss": 0.3006, "lr": 6.022842898217668e-06, "epoch": 9.820165094339622, "percentage": 49.1, "elapsed_time": "0:31:06", "remaining_time": "0:32:14", "throughput": 5821.53, "total_tokens": 10863888} {"current_steps": 16660, "total_steps": 33920, "loss": 0.4809, "lr": 6.020324455973788e-06, "epoch": 9.82311320754717, "percentage": 49.12, "elapsed_time": "0:31:06", "remaining_time": "0:32:13", "throughput": 5821.8, "total_tokens": 10867632} {"current_steps": 16665, "total_steps": 33920, "loss": 0.3865, "lr": 6.017805743594612e-06, "epoch": 9.826061320754716, "percentage": 49.13, "elapsed_time": "0:31:07", "remaining_time": "0:32:13", "throughput": 5821.71, "total_tokens": 10870192} {"current_steps": 16670, "total_steps": 33920, "loss": 0.3491, "lr": 6.0152867617469776e-06, "epoch": 9.829009433962264, "percentage": 49.15, "elapsed_time": "0:31:07", "remaining_time": "0:32:12", "throughput": 5821.69, "total_tokens": 10873264} {"current_steps": 16675, "total_steps": 33920, "loss": 0.3091, "lr": 6.012767511097799e-06, "epoch": 9.83195754716981, "percentage": 49.16, "elapsed_time": "0:31:08", "remaining_time": "0:32:12", "throughput": 5821.85, "total_tokens": 10876656} {"current_steps": 16680, "total_steps": 33920, "loss": 0.4253, "lr": 6.010247992314055e-06, "epoch": 9.834905660377359, "percentage": 49.17, "elapsed_time": "0:31:08", "remaining_time": "0:32:11", "throughput": 5821.95, "total_tokens": 10879824} {"current_steps": 16685, "total_steps": 33920, "loss": 0.3466, "lr": 6.007728206062802e-06, "epoch": 9.837853773584905, "percentage": 49.19, "elapsed_time": "0:31:09", "remaining_time": "0:32:10", "throughput": 5821.93, "total_tokens": 10882480} {"current_steps": 16690, "total_steps": 33920, "loss": 0.4112, "lr": 6.005208153011163e-06, "epoch": 9.840801886792454, "percentage": 49.2, "elapsed_time": "0:31:09", "remaining_time": "0:32:10", "throughput": 5822.02, "total_tokens": 10885648} {"current_steps": 16695, "total_steps": 33920, "loss": 0.3063, "lr": 6.0026878338263335e-06, "epoch": 9.84375, "percentage": 49.22, "elapsed_time": "0:31:10", "remaining_time": "0:32:09", "throughput": 5822.1, "total_tokens": 10888880} {"current_steps": 16700, "total_steps": 33920, "loss": 0.4255, "lr": 6.000167249175579e-06, "epoch": 9.846698113207546, "percentage": 49.23, "elapsed_time": "0:31:10", "remaining_time": "0:32:09", "throughput": 5822.18, "total_tokens": 10892304} {"current_steps": 16705, "total_steps": 33920, "loss": 0.5917, "lr": 5.997646399726236e-06, "epoch": 9.849646226415095, "percentage": 49.25, "elapsed_time": "0:31:11", "remaining_time": "0:32:08", "throughput": 5822.13, "total_tokens": 10894960} {"current_steps": 16710, "total_steps": 33920, "loss": 0.3054, "lr": 5.995125286145707e-06, "epoch": 9.852594339622641, "percentage": 49.26, "elapsed_time": "0:31:11", "remaining_time": "0:32:07", "throughput": 5822.15, "total_tokens": 10898352} {"current_steps": 16715, "total_steps": 33920, "loss": 0.4061, "lr": 5.99260390910147e-06, "epoch": 9.85554245283019, "percentage": 49.28, "elapsed_time": "0:31:12", "remaining_time": "0:32:07", "throughput": 5822.21, "total_tokens": 10901456} {"current_steps": 16720, "total_steps": 33920, "loss": 0.3434, "lr": 5.990082269261071e-06, "epoch": 9.858490566037736, "percentage": 49.29, "elapsed_time": "0:31:12", "remaining_time": "0:32:06", "throughput": 5822.34, "total_tokens": 10904560} {"current_steps": 16725, "total_steps": 33920, "loss": 0.4097, "lr": 5.987560367292123e-06, "epoch": 9.861438679245284, "percentage": 49.31, "elapsed_time": "0:31:13", "remaining_time": "0:32:06", "throughput": 5822.55, "total_tokens": 10908080} {"current_steps": 16730, "total_steps": 33920, "loss": 0.3271, "lr": 5.985038203862313e-06, "epoch": 9.86438679245283, "percentage": 49.32, "elapsed_time": "0:31:13", "remaining_time": "0:32:05", "throughput": 5822.6, "total_tokens": 10911056} {"current_steps": 16735, "total_steps": 33920, "loss": 0.2912, "lr": 5.982515779639393e-06, "epoch": 9.867334905660378, "percentage": 49.34, "elapsed_time": "0:31:14", "remaining_time": "0:32:04", "throughput": 5822.79, "total_tokens": 10914384} {"current_steps": 16740, "total_steps": 33920, "loss": 0.4713, "lr": 5.979993095291186e-06, "epoch": 9.870283018867925, "percentage": 49.35, "elapsed_time": "0:31:15", "remaining_time": "0:32:04", "throughput": 5822.93, "total_tokens": 10918000} {"current_steps": 16745, "total_steps": 33920, "loss": 0.2117, "lr": 5.977470151485582e-06, "epoch": 9.873231132075471, "percentage": 49.37, "elapsed_time": "0:31:15", "remaining_time": "0:32:03", "throughput": 5823.0, "total_tokens": 10921104} {"current_steps": 16750, "total_steps": 33920, "loss": 0.328, "lr": 5.974946948890544e-06, "epoch": 9.87617924528302, "percentage": 49.38, "elapsed_time": "0:31:16", "remaining_time": "0:32:03", "throughput": 5823.08, "total_tokens": 10924848} {"current_steps": 16755, "total_steps": 33920, "loss": 0.411, "lr": 5.9724234881740994e-06, "epoch": 9.879127358490566, "percentage": 49.4, "elapsed_time": "0:31:16", "remaining_time": "0:32:02", "throughput": 5823.22, "total_tokens": 10928208} {"current_steps": 16760, "total_steps": 33920, "loss": 0.334, "lr": 5.9698997700043445e-06, "epoch": 9.882075471698114, "percentage": 49.41, "elapsed_time": "0:31:17", "remaining_time": "0:32:02", "throughput": 5823.44, "total_tokens": 10931920} {"current_steps": 16765, "total_steps": 33920, "loss": 0.2803, "lr": 5.9673757950494475e-06, "epoch": 9.88502358490566, "percentage": 49.43, "elapsed_time": "0:31:17", "remaining_time": "0:32:01", "throughput": 5823.66, "total_tokens": 10936016} {"current_steps": 16770, "total_steps": 33920, "loss": 0.4116, "lr": 5.964851563977639e-06, "epoch": 9.887971698113208, "percentage": 49.44, "elapsed_time": "0:31:18", "remaining_time": "0:32:00", "throughput": 5823.43, "total_tokens": 10938224} {"current_steps": 16775, "total_steps": 33920, "loss": 0.2549, "lr": 5.962327077457219e-06, "epoch": 9.890919811320755, "percentage": 49.45, "elapsed_time": "0:31:18", "remaining_time": "0:32:00", "throughput": 5823.24, "total_tokens": 10940816} {"current_steps": 16780, "total_steps": 33920, "loss": 0.4353, "lr": 5.959802336156558e-06, "epoch": 9.893867924528301, "percentage": 49.47, "elapsed_time": "0:31:19", "remaining_time": "0:31:59", "throughput": 5823.11, "total_tokens": 10943536} {"current_steps": 16785, "total_steps": 33920, "loss": 0.367, "lr": 5.957277340744094e-06, "epoch": 9.89681603773585, "percentage": 49.48, "elapsed_time": "0:31:19", "remaining_time": "0:31:59", "throughput": 5823.0, "total_tokens": 10946480} {"current_steps": 16790, "total_steps": 33920, "loss": 0.5593, "lr": 5.954752091888326e-06, "epoch": 9.899764150943396, "percentage": 49.5, "elapsed_time": "0:31:20", "remaining_time": "0:31:58", "throughput": 5823.21, "total_tokens": 10949968} {"current_steps": 16795, "total_steps": 33920, "loss": 0.5114, "lr": 5.952226590257829e-06, "epoch": 9.902712264150944, "percentage": 49.51, "elapsed_time": "0:31:20", "remaining_time": "0:31:57", "throughput": 5823.22, "total_tokens": 10952656} {"current_steps": 16800, "total_steps": 33920, "loss": 0.3066, "lr": 5.949700836521239e-06, "epoch": 9.90566037735849, "percentage": 49.53, "elapsed_time": "0:31:21", "remaining_time": "0:31:57", "throughput": 5822.97, "total_tokens": 10954960} {"current_steps": 16805, "total_steps": 33920, "loss": 0.3967, "lr": 5.947174831347257e-06, "epoch": 9.908608490566039, "percentage": 49.54, "elapsed_time": "0:31:21", "remaining_time": "0:31:56", "throughput": 5822.98, "total_tokens": 10958256} {"current_steps": 16810, "total_steps": 33920, "loss": 0.4072, "lr": 5.944648575404657e-06, "epoch": 9.911556603773585, "percentage": 49.56, "elapsed_time": "0:31:22", "remaining_time": "0:31:56", "throughput": 5823.35, "total_tokens": 10963056} {"current_steps": 16815, "total_steps": 33920, "loss": 0.4447, "lr": 5.942122069362276e-06, "epoch": 9.914504716981131, "percentage": 49.57, "elapsed_time": "0:31:23", "remaining_time": "0:31:55", "throughput": 5823.39, "total_tokens": 10966384} {"current_steps": 16820, "total_steps": 33920, "loss": 0.4194, "lr": 5.939595313889016e-06, "epoch": 9.91745283018868, "percentage": 49.59, "elapsed_time": "0:31:23", "remaining_time": "0:31:55", "throughput": 5823.45, "total_tokens": 10969680} {"current_steps": 16825, "total_steps": 33920, "loss": 0.3625, "lr": 5.937068309653848e-06, "epoch": 9.920400943396226, "percentage": 49.6, "elapsed_time": "0:31:24", "remaining_time": "0:31:54", "throughput": 5823.67, "total_tokens": 10973360} {"current_steps": 16830, "total_steps": 33920, "loss": 0.3913, "lr": 5.934541057325807e-06, "epoch": 9.923349056603774, "percentage": 49.62, "elapsed_time": "0:31:24", "remaining_time": "0:31:53", "throughput": 5823.77, "total_tokens": 10976976} {"current_steps": 16835, "total_steps": 33920, "loss": 0.4516, "lr": 5.932013557573992e-06, "epoch": 9.92629716981132, "percentage": 49.63, "elapsed_time": "0:31:25", "remaining_time": "0:31:53", "throughput": 5824.0, "total_tokens": 10980560} {"current_steps": 16840, "total_steps": 33920, "loss": 0.3088, "lr": 5.929485811067572e-06, "epoch": 9.929245283018869, "percentage": 49.65, "elapsed_time": "0:31:25", "remaining_time": "0:31:52", "throughput": 5824.14, "total_tokens": 10984080} {"current_steps": 16845, "total_steps": 33920, "loss": 0.346, "lr": 5.926957818475778e-06, "epoch": 9.932193396226415, "percentage": 49.66, "elapsed_time": "0:31:26", "remaining_time": "0:31:52", "throughput": 5824.21, "total_tokens": 10987056} {"current_steps": 16850, "total_steps": 33920, "loss": 0.3832, "lr": 5.924429580467905e-06, "epoch": 9.935141509433961, "percentage": 49.68, "elapsed_time": "0:31:26", "remaining_time": "0:31:51", "throughput": 5824.32, "total_tokens": 10990480} {"current_steps": 16855, "total_steps": 33920, "loss": 0.3044, "lr": 5.921901097713317e-06, "epoch": 9.93808962264151, "percentage": 49.69, "elapsed_time": "0:31:27", "remaining_time": "0:31:51", "throughput": 5824.11, "total_tokens": 10993520} {"current_steps": 16860, "total_steps": 33920, "loss": 0.2404, "lr": 5.919372370881442e-06, "epoch": 9.941037735849056, "percentage": 49.71, "elapsed_time": "0:31:28", "remaining_time": "0:31:50", "throughput": 5823.97, "total_tokens": 10996208} {"current_steps": 16865, "total_steps": 33920, "loss": 0.413, "lr": 5.916843400641768e-06, "epoch": 9.943985849056604, "percentage": 49.72, "elapsed_time": "0:31:28", "remaining_time": "0:31:49", "throughput": 5824.23, "total_tokens": 11000016} {"current_steps": 16870, "total_steps": 33920, "loss": 0.3892, "lr": 5.914314187663851e-06, "epoch": 9.94693396226415, "percentage": 49.73, "elapsed_time": "0:31:29", "remaining_time": "0:31:49", "throughput": 5824.22, "total_tokens": 11003024} {"current_steps": 16875, "total_steps": 33920, "loss": 0.3314, "lr": 5.911784732617314e-06, "epoch": 9.949882075471699, "percentage": 49.75, "elapsed_time": "0:31:29", "remaining_time": "0:31:48", "throughput": 5823.92, "total_tokens": 11005168} {"current_steps": 16880, "total_steps": 33920, "loss": 0.3725, "lr": 5.90925503617184e-06, "epoch": 9.952830188679245, "percentage": 49.76, "elapsed_time": "0:31:30", "remaining_time": "0:31:48", "throughput": 5824.01, "total_tokens": 11008336} {"current_steps": 16885, "total_steps": 33920, "loss": 0.4573, "lr": 5.9067250989971745e-06, "epoch": 9.955778301886792, "percentage": 49.78, "elapsed_time": "0:31:30", "remaining_time": "0:31:47", "throughput": 5824.01, "total_tokens": 11011408} {"current_steps": 16890, "total_steps": 33920, "loss": 0.2939, "lr": 5.904194921763133e-06, "epoch": 9.95872641509434, "percentage": 49.79, "elapsed_time": "0:31:31", "remaining_time": "0:31:46", "throughput": 5824.22, "total_tokens": 11014928} {"current_steps": 16895, "total_steps": 33920, "loss": 0.3057, "lr": 5.901664505139589e-06, "epoch": 9.961674528301886, "percentage": 49.81, "elapsed_time": "0:31:31", "remaining_time": "0:31:46", "throughput": 5824.33, "total_tokens": 11018096} {"current_steps": 16900, "total_steps": 33920, "loss": 0.5172, "lr": 5.8991338497964814e-06, "epoch": 9.964622641509434, "percentage": 49.82, "elapsed_time": "0:31:32", "remaining_time": "0:31:45", "throughput": 5824.39, "total_tokens": 11021200} {"current_steps": 16905, "total_steps": 33920, "loss": 0.3481, "lr": 5.896602956403812e-06, "epoch": 9.96757075471698, "percentage": 49.84, "elapsed_time": "0:31:33", "remaining_time": "0:31:45", "throughput": 5824.78, "total_tokens": 11027280} {"current_steps": 16910, "total_steps": 33920, "loss": 0.3502, "lr": 5.894071825631645e-06, "epoch": 9.970518867924529, "percentage": 49.85, "elapsed_time": "0:31:33", "remaining_time": "0:31:44", "throughput": 5824.96, "total_tokens": 11030608} {"current_steps": 16915, "total_steps": 33920, "loss": 0.4036, "lr": 5.891540458150109e-06, "epoch": 9.973466981132075, "percentage": 49.87, "elapsed_time": "0:31:34", "remaining_time": "0:31:44", "throughput": 5825.3, "total_tokens": 11035056} {"current_steps": 16920, "total_steps": 33920, "loss": 0.5076, "lr": 5.889008854629395e-06, "epoch": 9.976415094339622, "percentage": 49.88, "elapsed_time": "0:31:34", "remaining_time": "0:31:43", "throughput": 5825.34, "total_tokens": 11038352} {"current_steps": 16925, "total_steps": 33920, "loss": 0.5762, "lr": 5.886477015739754e-06, "epoch": 9.97936320754717, "percentage": 49.9, "elapsed_time": "0:31:35", "remaining_time": "0:31:43", "throughput": 5825.16, "total_tokens": 11040912} {"current_steps": 16930, "total_steps": 33920, "loss": 0.3954, "lr": 5.883944942151502e-06, "epoch": 9.982311320754716, "percentage": 49.91, "elapsed_time": "0:31:35", "remaining_time": "0:31:42", "throughput": 5825.27, "total_tokens": 11044528} {"current_steps": 16935, "total_steps": 33920, "loss": 0.3634, "lr": 5.88141263453502e-06, "epoch": 9.985259433962264, "percentage": 49.93, "elapsed_time": "0:31:36", "remaining_time": "0:31:42", "throughput": 5825.23, "total_tokens": 11047152} {"current_steps": 16940, "total_steps": 33920, "loss": 0.2998, "lr": 5.878880093560744e-06, "epoch": 9.98820754716981, "percentage": 49.94, "elapsed_time": "0:31:36", "remaining_time": "0:31:41", "throughput": 5825.32, "total_tokens": 11050544} {"current_steps": 16945, "total_steps": 33920, "loss": 0.4117, "lr": 5.876347319899173e-06, "epoch": 9.991155660377359, "percentage": 49.96, "elapsed_time": "0:31:37", "remaining_time": "0:31:40", "throughput": 5825.22, "total_tokens": 11053040} {"current_steps": 16950, "total_steps": 33920, "loss": 0.5502, "lr": 5.873814314220874e-06, "epoch": 9.994103773584905, "percentage": 49.97, "elapsed_time": "0:31:38", "remaining_time": "0:31:40", "throughput": 5825.17, "total_tokens": 11056656} {"current_steps": 16955, "total_steps": 33920, "loss": 0.3848, "lr": 5.871281077196469e-06, "epoch": 9.997051886792454, "percentage": 49.99, "elapsed_time": "0:31:38", "remaining_time": "0:31:39", "throughput": 5825.13, "total_tokens": 11059440} {"current_steps": 16960, "total_steps": 33920, "loss": 0.4427, "lr": 5.868747609496643e-06, "epoch": 10.0, "percentage": 50.0, "elapsed_time": "0:31:39", "remaining_time": "0:31:39", "throughput": 5824.95, "total_tokens": 11063280} {"current_steps": 16960, "total_steps": 33920, "eval_loss": 0.52943354845047, "epoch": 10.0, "percentage": 50.0, "elapsed_time": "0:31:58", "remaining_time": "0:31:58", "throughput": 5766.53, "total_tokens": 11063280} {"current_steps": 16965, "total_steps": 33920, "loss": 0.3382, "lr": 5.8662139117921435e-06, "epoch": 10.002948113207546, "percentage": 50.01, "elapsed_time": "0:32:02", "remaining_time": "0:32:01", "throughput": 5756.7, "total_tokens": 11066480} {"current_steps": 16970, "total_steps": 33920, "loss": 0.3696, "lr": 5.8636799847537785e-06, "epoch": 10.005896226415095, "percentage": 50.03, "elapsed_time": "0:32:02", "remaining_time": "0:32:00", "throughput": 5756.99, "total_tokens": 11070448} {"current_steps": 16975, "total_steps": 33920, "loss": 0.3161, "lr": 5.861145829052415e-06, "epoch": 10.008844339622641, "percentage": 50.04, "elapsed_time": "0:32:03", "remaining_time": "0:32:00", "throughput": 5756.91, "total_tokens": 11073232} {"current_steps": 16980, "total_steps": 33920, "loss": 0.201, "lr": 5.858611445358982e-06, "epoch": 10.01179245283019, "percentage": 50.06, "elapsed_time": "0:32:03", "remaining_time": "0:31:59", "throughput": 5756.88, "total_tokens": 11076016} {"current_steps": 16985, "total_steps": 33920, "loss": 0.3956, "lr": 5.856076834344468e-06, "epoch": 10.014740566037736, "percentage": 50.07, "elapsed_time": "0:32:04", "remaining_time": "0:31:58", "throughput": 5757.16, "total_tokens": 11079760} {"current_steps": 16990, "total_steps": 33920, "loss": 0.4209, "lr": 5.853541996679924e-06, "epoch": 10.017688679245284, "percentage": 50.09, "elapsed_time": "0:32:05", "remaining_time": "0:31:58", "throughput": 5757.17, "total_tokens": 11082608} {"current_steps": 16995, "total_steps": 33920, "loss": 0.3841, "lr": 5.851006933036456e-06, "epoch": 10.02063679245283, "percentage": 50.1, "elapsed_time": "0:32:05", "remaining_time": "0:31:57", "throughput": 5757.0, "total_tokens": 11085616} {"current_steps": 17000, "total_steps": 33920, "loss": 0.433, "lr": 5.848471644085236e-06, "epoch": 10.023584905660377, "percentage": 50.12, "elapsed_time": "0:32:06", "remaining_time": "0:31:57", "throughput": 5757.39, "total_tokens": 11090096} {"current_steps": 17005, "total_steps": 33920, "loss": 0.3709, "lr": 5.84593613049749e-06, "epoch": 10.026533018867925, "percentage": 50.13, "elapsed_time": "0:32:06", "remaining_time": "0:31:56", "throughput": 5757.34, "total_tokens": 11092848} {"current_steps": 17010, "total_steps": 33920, "loss": 0.4307, "lr": 5.843400392944509e-06, "epoch": 10.029481132075471, "percentage": 50.15, "elapsed_time": "0:32:07", "remaining_time": "0:31:55", "throughput": 5757.42, "total_tokens": 11095792} {"current_steps": 17015, "total_steps": 33920, "loss": 0.4455, "lr": 5.840864432097639e-06, "epoch": 10.03242924528302, "percentage": 50.16, "elapsed_time": "0:32:07", "remaining_time": "0:31:55", "throughput": 5757.87, "total_tokens": 11100528} {"current_steps": 17020, "total_steps": 33920, "loss": 0.3511, "lr": 5.838328248628286e-06, "epoch": 10.035377358490566, "percentage": 50.18, "elapsed_time": "0:32:08", "remaining_time": "0:31:54", "throughput": 5757.96, "total_tokens": 11103824} {"current_steps": 17025, "total_steps": 33920, "loss": 0.4317, "lr": 5.835791843207916e-06, "epoch": 10.038325471698114, "percentage": 50.19, "elapsed_time": "0:32:08", "remaining_time": "0:31:54", "throughput": 5758.06, "total_tokens": 11107184} {"current_steps": 17030, "total_steps": 33920, "loss": 0.4389, "lr": 5.833255216508056e-06, "epoch": 10.04127358490566, "percentage": 50.21, "elapsed_time": "0:32:10", "remaining_time": "0:31:54", "throughput": 5758.55, "total_tokens": 11114512} {"current_steps": 17035, "total_steps": 33920, "loss": 0.4194, "lr": 5.830718369200284e-06, "epoch": 10.044221698113208, "percentage": 50.22, "elapsed_time": "0:32:10", "remaining_time": "0:31:53", "throughput": 5758.32, "total_tokens": 11116912} {"current_steps": 17040, "total_steps": 33920, "loss": 0.3677, "lr": 5.828181301956244e-06, "epoch": 10.047169811320755, "percentage": 50.24, "elapsed_time": "0:32:11", "remaining_time": "0:31:52", "throughput": 5758.44, "total_tokens": 11120176} {"current_steps": 17045, "total_steps": 33920, "loss": 0.3028, "lr": 5.825644015447636e-06, "epoch": 10.050117924528301, "percentage": 50.25, "elapsed_time": "0:32:11", "remaining_time": "0:31:52", "throughput": 5758.42, "total_tokens": 11122896} {"current_steps": 17050, "total_steps": 33920, "loss": 0.436, "lr": 5.823106510346216e-06, "epoch": 10.05306603773585, "percentage": 50.27, "elapsed_time": "0:32:12", "remaining_time": "0:31:51", "throughput": 5758.53, "total_tokens": 11126256} {"current_steps": 17055, "total_steps": 33920, "loss": 0.3686, "lr": 5.820568787323798e-06, "epoch": 10.056014150943396, "percentage": 50.28, "elapsed_time": "0:32:12", "remaining_time": "0:31:51", "throughput": 5758.49, "total_tokens": 11129040} {"current_steps": 17060, "total_steps": 33920, "loss": 0.3068, "lr": 5.818030847052258e-06, "epoch": 10.058962264150944, "percentage": 50.29, "elapsed_time": "0:32:13", "remaining_time": "0:31:50", "throughput": 5758.54, "total_tokens": 11132016} {"current_steps": 17065, "total_steps": 33920, "loss": 0.3379, "lr": 5.815492690203528e-06, "epoch": 10.06191037735849, "percentage": 50.31, "elapsed_time": "0:32:13", "remaining_time": "0:31:49", "throughput": 5758.56, "total_tokens": 11134864} {"current_steps": 17070, "total_steps": 33920, "loss": 0.609, "lr": 5.812954317449591e-06, "epoch": 10.064858490566039, "percentage": 50.32, "elapsed_time": "0:32:14", "remaining_time": "0:31:49", "throughput": 5758.61, "total_tokens": 11138032} {"current_steps": 17075, "total_steps": 33920, "loss": 0.3786, "lr": 5.810415729462496e-06, "epoch": 10.067806603773585, "percentage": 50.34, "elapsed_time": "0:32:14", "remaining_time": "0:31:48", "throughput": 5758.6, "total_tokens": 11140944} {"current_steps": 17080, "total_steps": 33920, "loss": 0.3007, "lr": 5.807876926914344e-06, "epoch": 10.070754716981131, "percentage": 50.35, "elapsed_time": "0:32:15", "remaining_time": "0:31:48", "throughput": 5758.7, "total_tokens": 11144496} {"current_steps": 17085, "total_steps": 33920, "loss": 0.3227, "lr": 5.8053379104772935e-06, "epoch": 10.07370283018868, "percentage": 50.37, "elapsed_time": "0:32:15", "remaining_time": "0:31:47", "throughput": 5758.66, "total_tokens": 11147440} {"current_steps": 17090, "total_steps": 33920, "loss": 0.416, "lr": 5.802798680823562e-06, "epoch": 10.076650943396226, "percentage": 50.38, "elapsed_time": "0:32:16", "remaining_time": "0:31:46", "throughput": 5758.55, "total_tokens": 11150032} {"current_steps": 17095, "total_steps": 33920, "loss": 0.3803, "lr": 5.8002592386254186e-06, "epoch": 10.079599056603774, "percentage": 50.4, "elapsed_time": "0:32:16", "remaining_time": "0:31:46", "throughput": 5758.56, "total_tokens": 11152912} {"current_steps": 17100, "total_steps": 33920, "loss": 0.3678, "lr": 5.797719584555192e-06, "epoch": 10.08254716981132, "percentage": 50.41, "elapsed_time": "0:32:17", "remaining_time": "0:31:45", "throughput": 5758.56, "total_tokens": 11155920} {"current_steps": 17105, "total_steps": 33920, "loss": 0.4083, "lr": 5.795179719285269e-06, "epoch": 10.085495283018869, "percentage": 50.43, "elapsed_time": "0:32:17", "remaining_time": "0:31:44", "throughput": 5758.49, "total_tokens": 11158896} {"current_steps": 17110, "total_steps": 33920, "loss": 0.3617, "lr": 5.792639643488086e-06, "epoch": 10.088443396226415, "percentage": 50.44, "elapsed_time": "0:32:18", "remaining_time": "0:31:44", "throughput": 5758.32, "total_tokens": 11161424} {"current_steps": 17115, "total_steps": 33920, "loss": 0.3653, "lr": 5.7900993578361434e-06, "epoch": 10.091391509433961, "percentage": 50.46, "elapsed_time": "0:32:18", "remaining_time": "0:31:43", "throughput": 5758.35, "total_tokens": 11164304} {"current_steps": 17120, "total_steps": 33920, "loss": 0.3009, "lr": 5.7875588630019895e-06, "epoch": 10.09433962264151, "percentage": 50.47, "elapsed_time": "0:32:19", "remaining_time": "0:31:43", "throughput": 5758.54, "total_tokens": 11168048} {"current_steps": 17125, "total_steps": 33920, "loss": 0.2757, "lr": 5.7850181596582335e-06, "epoch": 10.097287735849056, "percentage": 50.49, "elapsed_time": "0:32:19", "remaining_time": "0:31:42", "throughput": 5758.25, "total_tokens": 11170288} {"current_steps": 17130, "total_steps": 33920, "loss": 0.441, "lr": 5.782477248477535e-06, "epoch": 10.100235849056604, "percentage": 50.5, "elapsed_time": "0:32:20", "remaining_time": "0:31:41", "throughput": 5758.22, "total_tokens": 11173296} {"current_steps": 17135, "total_steps": 33920, "loss": 0.3755, "lr": 5.779936130132614e-06, "epoch": 10.10318396226415, "percentage": 50.52, "elapsed_time": "0:32:20", "remaining_time": "0:31:41", "throughput": 5758.43, "total_tokens": 11177072} {"current_steps": 17140, "total_steps": 33920, "loss": 0.3886, "lr": 5.777394805296242e-06, "epoch": 10.106132075471699, "percentage": 50.53, "elapsed_time": "0:32:21", "remaining_time": "0:31:40", "throughput": 5758.47, "total_tokens": 11180720} {"current_steps": 17145, "total_steps": 33920, "loss": 0.3377, "lr": 5.774853274641243e-06, "epoch": 10.109080188679245, "percentage": 50.55, "elapsed_time": "0:32:22", "remaining_time": "0:31:40", "throughput": 5758.38, "total_tokens": 11184144} {"current_steps": 17150, "total_steps": 33920, "loss": 0.3566, "lr": 5.772311538840501e-06, "epoch": 10.112028301886792, "percentage": 50.56, "elapsed_time": "0:32:22", "remaining_time": "0:31:39", "throughput": 5758.27, "total_tokens": 11186928} {"current_steps": 17155, "total_steps": 33920, "loss": 0.375, "lr": 5.76976959856695e-06, "epoch": 10.11497641509434, "percentage": 50.57, "elapsed_time": "0:32:23", "remaining_time": "0:31:39", "throughput": 5758.07, "total_tokens": 11189808} {"current_steps": 17160, "total_steps": 33920, "loss": 0.3196, "lr": 5.767227454493582e-06, "epoch": 10.117924528301886, "percentage": 50.59, "elapsed_time": "0:32:23", "remaining_time": "0:31:38", "throughput": 5757.96, "total_tokens": 11192816} {"current_steps": 17165, "total_steps": 33920, "loss": 0.371, "lr": 5.764685107293436e-06, "epoch": 10.120872641509434, "percentage": 50.6, "elapsed_time": "0:32:24", "remaining_time": "0:31:37", "throughput": 5758.09, "total_tokens": 11196240} {"current_steps": 17170, "total_steps": 33920, "loss": 0.2972, "lr": 5.762142557639614e-06, "epoch": 10.12382075471698, "percentage": 50.62, "elapsed_time": "0:32:25", "remaining_time": "0:31:37", "throughput": 5758.14, "total_tokens": 11199888} {"current_steps": 17175, "total_steps": 33920, "loss": 0.3689, "lr": 5.759599806205266e-06, "epoch": 10.126768867924529, "percentage": 50.63, "elapsed_time": "0:32:25", "remaining_time": "0:31:36", "throughput": 5758.06, "total_tokens": 11202864} {"current_steps": 17180, "total_steps": 33920, "loss": 0.3085, "lr": 5.757056853663594e-06, "epoch": 10.129716981132075, "percentage": 50.65, "elapsed_time": "0:32:26", "remaining_time": "0:31:36", "throughput": 5757.91, "total_tokens": 11205840} {"current_steps": 17185, "total_steps": 33920, "loss": 0.3276, "lr": 5.754513700687858e-06, "epoch": 10.132665094339623, "percentage": 50.66, "elapsed_time": "0:32:26", "remaining_time": "0:31:35", "throughput": 5757.54, "total_tokens": 11208112} {"current_steps": 17190, "total_steps": 33920, "loss": 0.2732, "lr": 5.751970347951369e-06, "epoch": 10.13561320754717, "percentage": 50.68, "elapsed_time": "0:32:27", "remaining_time": "0:31:35", "throughput": 5757.19, "total_tokens": 11210608} {"current_steps": 17195, "total_steps": 33920, "loss": 0.4057, "lr": 5.7494267961274875e-06, "epoch": 10.138561320754716, "percentage": 50.69, "elapsed_time": "0:32:27", "remaining_time": "0:31:34", "throughput": 5757.14, "total_tokens": 11213872} {"current_steps": 17200, "total_steps": 33920, "loss": 0.2573, "lr": 5.746883045889633e-06, "epoch": 10.141509433962264, "percentage": 50.71, "elapsed_time": "0:32:28", "remaining_time": "0:31:33", "throughput": 5757.04, "total_tokens": 11216848} {"current_steps": 17205, "total_steps": 33920, "loss": 0.3192, "lr": 5.744339097911272e-06, "epoch": 10.14445754716981, "percentage": 50.72, "elapsed_time": "0:32:28", "remaining_time": "0:31:33", "throughput": 5756.99, "total_tokens": 11219792} {"current_steps": 17210, "total_steps": 33920, "loss": 0.3808, "lr": 5.741794952865928e-06, "epoch": 10.147405660377359, "percentage": 50.74, "elapsed_time": "0:32:29", "remaining_time": "0:31:32", "throughput": 5756.55, "total_tokens": 11222544} {"current_steps": 17215, "total_steps": 33920, "loss": 0.4416, "lr": 5.739250611427173e-06, "epoch": 10.150353773584905, "percentage": 50.75, "elapsed_time": "0:32:30", "remaining_time": "0:31:32", "throughput": 5756.48, "total_tokens": 11225808} {"current_steps": 17220, "total_steps": 33920, "loss": 0.5447, "lr": 5.736706074268633e-06, "epoch": 10.153301886792454, "percentage": 50.77, "elapsed_time": "0:32:30", "remaining_time": "0:31:31", "throughput": 5756.42, "total_tokens": 11229776} {"current_steps": 17225, "total_steps": 33920, "loss": 0.3847, "lr": 5.734161342063984e-06, "epoch": 10.15625, "percentage": 50.78, "elapsed_time": "0:32:31", "remaining_time": "0:31:31", "throughput": 5756.08, "total_tokens": 11232976} {"current_steps": 17230, "total_steps": 33920, "loss": 0.3187, "lr": 5.731616415486957e-06, "epoch": 10.159198113207546, "percentage": 50.8, "elapsed_time": "0:32:32", "remaining_time": "0:31:30", "throughput": 5755.71, "total_tokens": 11235984} {"current_steps": 17235, "total_steps": 33920, "loss": 0.454, "lr": 5.72907129521133e-06, "epoch": 10.162146226415095, "percentage": 50.81, "elapsed_time": "0:32:32", "remaining_time": "0:31:30", "throughput": 5755.58, "total_tokens": 11239472} {"current_steps": 17240, "total_steps": 33920, "loss": 0.3823, "lr": 5.726525981910935e-06, "epoch": 10.165094339622641, "percentage": 50.83, "elapsed_time": "0:32:33", "remaining_time": "0:31:30", "throughput": 5755.52, "total_tokens": 11243312} {"current_steps": 17245, "total_steps": 33920, "loss": 0.3964, "lr": 5.723980476259658e-06, "epoch": 10.16804245283019, "percentage": 50.84, "elapsed_time": "0:32:34", "remaining_time": "0:31:29", "throughput": 5755.43, "total_tokens": 11246736} {"current_steps": 17250, "total_steps": 33920, "loss": 0.4034, "lr": 5.721434778931426e-06, "epoch": 10.170990566037736, "percentage": 50.85, "elapsed_time": "0:32:34", "remaining_time": "0:31:28", "throughput": 5755.24, "total_tokens": 11249488} {"current_steps": 17255, "total_steps": 33920, "loss": 0.3016, "lr": 5.7188888906002284e-06, "epoch": 10.173938679245284, "percentage": 50.87, "elapsed_time": "0:32:35", "remaining_time": "0:31:28", "throughput": 5755.16, "total_tokens": 11253328} {"current_steps": 17260, "total_steps": 33920, "loss": 0.3584, "lr": 5.716342811940098e-06, "epoch": 10.17688679245283, "percentage": 50.88, "elapsed_time": "0:32:35", "remaining_time": "0:31:27", "throughput": 5755.12, "total_tokens": 11256944} {"current_steps": 17265, "total_steps": 33920, "loss": 0.3687, "lr": 5.713796543625123e-06, "epoch": 10.179834905660377, "percentage": 50.9, "elapsed_time": "0:32:36", "remaining_time": "0:31:27", "throughput": 5754.96, "total_tokens": 11260240} {"current_steps": 17270, "total_steps": 33920, "loss": 0.2955, "lr": 5.711250086329435e-06, "epoch": 10.182783018867925, "percentage": 50.91, "elapsed_time": "0:32:37", "remaining_time": "0:31:26", "throughput": 5754.49, "total_tokens": 11262864} {"current_steps": 17275, "total_steps": 33920, "loss": 0.3456, "lr": 5.7087034407272225e-06, "epoch": 10.185731132075471, "percentage": 50.93, "elapsed_time": "0:32:37", "remaining_time": "0:31:26", "throughput": 5754.22, "total_tokens": 11265744} {"current_steps": 17280, "total_steps": 33920, "loss": 0.3833, "lr": 5.70615660749272e-06, "epoch": 10.18867924528302, "percentage": 50.94, "elapsed_time": "0:32:38", "remaining_time": "0:31:25", "throughput": 5754.12, "total_tokens": 11268528} {"current_steps": 17285, "total_steps": 33920, "loss": 0.5305, "lr": 5.7036095873002106e-06, "epoch": 10.191627358490566, "percentage": 50.96, "elapsed_time": "0:32:38", "remaining_time": "0:31:25", "throughput": 5754.15, "total_tokens": 11271824} {"current_steps": 17290, "total_steps": 33920, "loss": 0.2883, "lr": 5.701062380824032e-06, "epoch": 10.194575471698114, "percentage": 50.97, "elapsed_time": "0:32:39", "remaining_time": "0:31:24", "throughput": 5754.15, "total_tokens": 11275216} {"current_steps": 17295, "total_steps": 33920, "loss": 0.3354, "lr": 5.698514988738566e-06, "epoch": 10.19752358490566, "percentage": 50.99, "elapsed_time": "0:32:40", "remaining_time": "0:31:24", "throughput": 5754.03, "total_tokens": 11278064} {"current_steps": 17300, "total_steps": 33920, "loss": 0.421, "lr": 5.6959674117182465e-06, "epoch": 10.200471698113208, "percentage": 51.0, "elapsed_time": "0:32:40", "remaining_time": "0:31:23", "throughput": 5754.04, "total_tokens": 11282736} {"current_steps": 17305, "total_steps": 33920, "loss": 0.402, "lr": 5.693419650437554e-06, "epoch": 10.203419811320755, "percentage": 51.02, "elapsed_time": "0:32:41", "remaining_time": "0:31:23", "throughput": 5753.65, "total_tokens": 11285200} {"current_steps": 17310, "total_steps": 33920, "loss": 0.3823, "lr": 5.690871705571022e-06, "epoch": 10.206367924528301, "percentage": 51.03, "elapsed_time": "0:32:41", "remaining_time": "0:31:22", "throughput": 5753.22, "total_tokens": 11287376} {"current_steps": 17315, "total_steps": 33920, "loss": 0.4477, "lr": 5.688323577793229e-06, "epoch": 10.20931603773585, "percentage": 51.05, "elapsed_time": "0:32:42", "remaining_time": "0:31:22", "throughput": 5753.04, "total_tokens": 11290288} {"current_steps": 17320, "total_steps": 33920, "loss": 0.4168, "lr": 5.685775267778801e-06, "epoch": 10.212264150943396, "percentage": 51.06, "elapsed_time": "0:32:43", "remaining_time": "0:31:21", "throughput": 5752.83, "total_tokens": 11292976} {"current_steps": 17325, "total_steps": 33920, "loss": 0.4327, "lr": 5.683226776202416e-06, "epoch": 10.215212264150944, "percentage": 51.08, "elapsed_time": "0:32:43", "remaining_time": "0:31:20", "throughput": 5752.92, "total_tokens": 11296656} {"current_steps": 17330, "total_steps": 33920, "loss": 0.48, "lr": 5.680678103738798e-06, "epoch": 10.21816037735849, "percentage": 51.09, "elapsed_time": "0:32:44", "remaining_time": "0:31:20", "throughput": 5752.91, "total_tokens": 11299760} {"current_steps": 17335, "total_steps": 33920, "loss": 0.3417, "lr": 5.678129251062717e-06, "epoch": 10.221108490566039, "percentage": 51.11, "elapsed_time": "0:32:44", "remaining_time": "0:31:19", "throughput": 5752.78, "total_tokens": 11302736} {"current_steps": 17340, "total_steps": 33920, "loss": 0.3446, "lr": 5.675580218848995e-06, "epoch": 10.224056603773585, "percentage": 51.12, "elapsed_time": "0:32:45", "remaining_time": "0:31:19", "throughput": 5752.76, "total_tokens": 11305968} {"current_steps": 17345, "total_steps": 33920, "loss": 0.3756, "lr": 5.673031007772498e-06, "epoch": 10.227004716981131, "percentage": 51.14, "elapsed_time": "0:32:45", "remaining_time": "0:31:18", "throughput": 5752.67, "total_tokens": 11309040} {"current_steps": 17350, "total_steps": 33920, "loss": 0.3604, "lr": 5.670481618508141e-06, "epoch": 10.22995283018868, "percentage": 51.15, "elapsed_time": "0:32:46", "remaining_time": "0:31:17", "throughput": 5752.57, "total_tokens": 11311760} {"current_steps": 17355, "total_steps": 33920, "loss": 0.341, "lr": 5.667932051730887e-06, "epoch": 10.232900943396226, "percentage": 51.16, "elapsed_time": "0:32:46", "remaining_time": "0:31:17", "throughput": 5752.46, "total_tokens": 11314704} {"current_steps": 17360, "total_steps": 33920, "loss": 0.3543, "lr": 5.6653823081157434e-06, "epoch": 10.235849056603774, "percentage": 51.18, "elapsed_time": "0:32:47", "remaining_time": "0:31:16", "throughput": 5752.36, "total_tokens": 11317808} {"current_steps": 17365, "total_steps": 33920, "loss": 0.397, "lr": 5.662832388337766e-06, "epoch": 10.23879716981132, "percentage": 51.19, "elapsed_time": "0:32:48", "remaining_time": "0:31:16", "throughput": 5752.44, "total_tokens": 11320816} {"current_steps": 17370, "total_steps": 33920, "loss": 0.3498, "lr": 5.660282293072057e-06, "epoch": 10.241745283018869, "percentage": 51.21, "elapsed_time": "0:32:48", "remaining_time": "0:31:15", "throughput": 5752.67, "total_tokens": 11325232} {"current_steps": 17375, "total_steps": 33920, "loss": 0.3768, "lr": 5.657732022993765e-06, "epoch": 10.244693396226415, "percentage": 51.22, "elapsed_time": "0:32:49", "remaining_time": "0:31:15", "throughput": 5752.51, "total_tokens": 11328368} {"current_steps": 17380, "total_steps": 33920, "loss": 0.4547, "lr": 5.655181578778085e-06, "epoch": 10.247641509433961, "percentage": 51.24, "elapsed_time": "0:32:49", "remaining_time": "0:31:14", "throughput": 5752.52, "total_tokens": 11331312} {"current_steps": 17385, "total_steps": 33920, "loss": 0.2458, "lr": 5.65263096110026e-06, "epoch": 10.25058962264151, "percentage": 51.25, "elapsed_time": "0:32:50", "remaining_time": "0:31:14", "throughput": 5752.28, "total_tokens": 11334032} {"current_steps": 17390, "total_steps": 33920, "loss": 0.3472, "lr": 5.650080170635573e-06, "epoch": 10.253537735849056, "percentage": 51.27, "elapsed_time": "0:32:50", "remaining_time": "0:31:13", "throughput": 5752.19, "total_tokens": 11337328} {"current_steps": 17395, "total_steps": 33920, "loss": 0.3258, "lr": 5.647529208059359e-06, "epoch": 10.256485849056604, "percentage": 51.28, "elapsed_time": "0:32:51", "remaining_time": "0:31:12", "throughput": 5752.06, "total_tokens": 11340240} {"current_steps": 17400, "total_steps": 33920, "loss": 0.4787, "lr": 5.6449780740469985e-06, "epoch": 10.25943396226415, "percentage": 51.3, "elapsed_time": "0:32:52", "remaining_time": "0:31:12", "throughput": 5752.08, "total_tokens": 11343536} {"current_steps": 17405, "total_steps": 33920, "loss": 0.3464, "lr": 5.642426769273912e-06, "epoch": 10.262382075471699, "percentage": 51.31, "elapsed_time": "0:32:52", "remaining_time": "0:31:11", "throughput": 5752.03, "total_tokens": 11346544} {"current_steps": 17410, "total_steps": 33920, "loss": 0.2924, "lr": 5.63987529441557e-06, "epoch": 10.265330188679245, "percentage": 51.33, "elapsed_time": "0:32:53", "remaining_time": "0:31:11", "throughput": 5752.2, "total_tokens": 11350096} {"current_steps": 17415, "total_steps": 33920, "loss": 0.4884, "lr": 5.637323650147487e-06, "epoch": 10.268278301886792, "percentage": 51.34, "elapsed_time": "0:32:53", "remaining_time": "0:31:10", "throughput": 5751.89, "total_tokens": 11352688} {"current_steps": 17420, "total_steps": 33920, "loss": 0.281, "lr": 5.63477183714522e-06, "epoch": 10.27122641509434, "percentage": 51.36, "elapsed_time": "0:32:54", "remaining_time": "0:31:10", "throughput": 5751.7, "total_tokens": 11355824} {"current_steps": 17425, "total_steps": 33920, "loss": 0.4866, "lr": 5.632219856084373e-06, "epoch": 10.274174528301886, "percentage": 51.37, "elapsed_time": "0:32:54", "remaining_time": "0:31:09", "throughput": 5751.73, "total_tokens": 11359152} {"current_steps": 17430, "total_steps": 33920, "loss": 0.4205, "lr": 5.6296677076405944e-06, "epoch": 10.277122641509434, "percentage": 51.39, "elapsed_time": "0:32:55", "remaining_time": "0:31:08", "throughput": 5751.54, "total_tokens": 11362320} {"current_steps": 17435, "total_steps": 33920, "loss": 0.3303, "lr": 5.627115392489578e-06, "epoch": 10.28007075471698, "percentage": 51.4, "elapsed_time": "0:32:56", "remaining_time": "0:31:08", "throughput": 5751.79, "total_tokens": 11366608} {"current_steps": 17440, "total_steps": 33920, "loss": 0.3174, "lr": 5.624562911307058e-06, "epoch": 10.283018867924529, "percentage": 51.42, "elapsed_time": "0:32:56", "remaining_time": "0:31:07", "throughput": 5751.63, "total_tokens": 11369616} {"current_steps": 17445, "total_steps": 33920, "loss": 0.4381, "lr": 5.622010264768813e-06, "epoch": 10.285966981132075, "percentage": 51.43, "elapsed_time": "0:32:57", "remaining_time": "0:31:07", "throughput": 5751.49, "total_tokens": 11372624} {"current_steps": 17450, "total_steps": 33920, "loss": 0.2626, "lr": 5.619457453550673e-06, "epoch": 10.288915094339623, "percentage": 51.44, "elapsed_time": "0:32:57", "remaining_time": "0:31:06", "throughput": 5751.52, "total_tokens": 11376144} {"current_steps": 17455, "total_steps": 33920, "loss": 0.4153, "lr": 5.616904478328502e-06, "epoch": 10.29186320754717, "percentage": 51.46, "elapsed_time": "0:32:58", "remaining_time": "0:31:06", "throughput": 5751.19, "total_tokens": 11379216} {"current_steps": 17460, "total_steps": 33920, "loss": 0.4119, "lr": 5.6143513397782104e-06, "epoch": 10.294811320754716, "percentage": 51.47, "elapsed_time": "0:32:59", "remaining_time": "0:31:05", "throughput": 5750.9, "total_tokens": 11382032} {"current_steps": 17465, "total_steps": 33920, "loss": 0.4468, "lr": 5.611798038575755e-06, "epoch": 10.297759433962264, "percentage": 51.49, "elapsed_time": "0:32:59", "remaining_time": "0:31:05", "throughput": 5750.81, "total_tokens": 11384752} {"current_steps": 17470, "total_steps": 33920, "loss": 0.2419, "lr": 5.609244575397131e-06, "epoch": 10.30070754716981, "percentage": 51.5, "elapsed_time": "0:33:00", "remaining_time": "0:31:04", "throughput": 5750.8, "total_tokens": 11388048} {"current_steps": 17475, "total_steps": 33920, "loss": 0.3855, "lr": 5.606690950918381e-06, "epoch": 10.303655660377359, "percentage": 51.52, "elapsed_time": "0:33:00", "remaining_time": "0:31:04", "throughput": 5750.83, "total_tokens": 11391152} {"current_steps": 17480, "total_steps": 33920, "loss": 0.3195, "lr": 5.604137165815586e-06, "epoch": 10.306603773584905, "percentage": 51.53, "elapsed_time": "0:33:01", "remaining_time": "0:31:03", "throughput": 5750.92, "total_tokens": 11394864} {"current_steps": 17485, "total_steps": 33920, "loss": 0.3805, "lr": 5.601583220764874e-06, "epoch": 10.309551886792454, "percentage": 51.55, "elapsed_time": "0:33:02", "remaining_time": "0:31:03", "throughput": 5751.06, "total_tokens": 11399984} {"current_steps": 17490, "total_steps": 33920, "loss": 0.3897, "lr": 5.599029116442409e-06, "epoch": 10.3125, "percentage": 51.56, "elapsed_time": "0:33:02", "remaining_time": "0:31:02", "throughput": 5750.88, "total_tokens": 11402864} {"current_steps": 17495, "total_steps": 33920, "loss": 0.3776, "lr": 5.596474853524406e-06, "epoch": 10.315448113207546, "percentage": 51.58, "elapsed_time": "0:33:03", "remaining_time": "0:31:02", "throughput": 5750.43, "total_tokens": 11405232} {"current_steps": 17500, "total_steps": 33920, "loss": 0.5069, "lr": 5.593920432687115e-06, "epoch": 10.318396226415095, "percentage": 51.59, "elapsed_time": "0:33:03", "remaining_time": "0:31:01", "throughput": 5750.31, "total_tokens": 11408048} {"current_steps": 17505, "total_steps": 33920, "loss": 0.3743, "lr": 5.591365854606829e-06, "epoch": 10.321344339622641, "percentage": 51.61, "elapsed_time": "0:33:04", "remaining_time": "0:31:00", "throughput": 5750.47, "total_tokens": 11412016} {"current_steps": 17510, "total_steps": 33920, "loss": 0.3291, "lr": 5.588811119959885e-06, "epoch": 10.32429245283019, "percentage": 51.62, "elapsed_time": "0:33:05", "remaining_time": "0:31:00", "throughput": 5750.4, "total_tokens": 11414960} {"current_steps": 17515, "total_steps": 33920, "loss": 0.684, "lr": 5.58625622942266e-06, "epoch": 10.327240566037736, "percentage": 51.64, "elapsed_time": "0:33:05", "remaining_time": "0:30:59", "throughput": 5750.25, "total_tokens": 11417840} {"current_steps": 17520, "total_steps": 33920, "loss": 0.2969, "lr": 5.58370118367157e-06, "epoch": 10.330188679245284, "percentage": 51.65, "elapsed_time": "0:33:06", "remaining_time": "0:30:59", "throughput": 5750.15, "total_tokens": 11421360} {"current_steps": 17525, "total_steps": 33920, "loss": 0.4068, "lr": 5.581145983383077e-06, "epoch": 10.33313679245283, "percentage": 51.67, "elapsed_time": "0:33:06", "remaining_time": "0:30:58", "throughput": 5749.97, "total_tokens": 11424368} {"current_steps": 17530, "total_steps": 33920, "loss": 0.2624, "lr": 5.57859062923368e-06, "epoch": 10.336084905660377, "percentage": 51.68, "elapsed_time": "0:33:07", "remaining_time": "0:30:58", "throughput": 5749.73, "total_tokens": 11427056} {"current_steps": 17535, "total_steps": 33920, "loss": 0.3341, "lr": 5.5760351218999194e-06, "epoch": 10.339033018867925, "percentage": 51.7, "elapsed_time": "0:33:08", "remaining_time": "0:30:57", "throughput": 5749.83, "total_tokens": 11431152} {"current_steps": 17540, "total_steps": 33920, "loss": 0.4114, "lr": 5.573479462058379e-06, "epoch": 10.341981132075471, "percentage": 51.71, "elapsed_time": "0:33:08", "remaining_time": "0:30:57", "throughput": 5749.54, "total_tokens": 11433680} {"current_steps": 17545, "total_steps": 33920, "loss": 0.3669, "lr": 5.570923650385679e-06, "epoch": 10.34492924528302, "percentage": 51.72, "elapsed_time": "0:33:09", "remaining_time": "0:30:56", "throughput": 5749.27, "total_tokens": 11436208} {"current_steps": 17550, "total_steps": 33920, "loss": 0.4004, "lr": 5.568367687558481e-06, "epoch": 10.347877358490566, "percentage": 51.74, "elapsed_time": "0:33:09", "remaining_time": "0:30:55", "throughput": 5748.76, "total_tokens": 11438384} {"current_steps": 17555, "total_steps": 33920, "loss": 0.4195, "lr": 5.56581157425349e-06, "epoch": 10.350825471698114, "percentage": 51.75, "elapsed_time": "0:33:10", "remaining_time": "0:30:55", "throughput": 5748.53, "total_tokens": 11440976} {"current_steps": 17560, "total_steps": 33920, "loss": 0.3413, "lr": 5.563255311147446e-06, "epoch": 10.35377358490566, "percentage": 51.77, "elapsed_time": "0:33:10", "remaining_time": "0:30:54", "throughput": 5748.72, "total_tokens": 11444816} {"current_steps": 17565, "total_steps": 33920, "loss": 0.3753, "lr": 5.560698898917129e-06, "epoch": 10.356721698113208, "percentage": 51.78, "elapsed_time": "0:33:11", "remaining_time": "0:30:54", "throughput": 5748.46, "total_tokens": 11447376} {"current_steps": 17570, "total_steps": 33920, "loss": 0.3708, "lr": 5.558142338239365e-06, "epoch": 10.359669811320755, "percentage": 51.8, "elapsed_time": "0:33:11", "remaining_time": "0:30:53", "throughput": 5748.58, "total_tokens": 11450896} {"current_steps": 17575, "total_steps": 33920, "loss": 0.4119, "lr": 5.55558562979101e-06, "epoch": 10.362617924528301, "percentage": 51.81, "elapsed_time": "0:33:12", "remaining_time": "0:30:53", "throughput": 5748.25, "total_tokens": 11453584} {"current_steps": 17580, "total_steps": 33920, "loss": 0.4158, "lr": 5.553028774248964e-06, "epoch": 10.36556603773585, "percentage": 51.83, "elapsed_time": "0:33:13", "remaining_time": "0:30:52", "throughput": 5748.04, "total_tokens": 11456272} {"current_steps": 17585, "total_steps": 33920, "loss": 0.3593, "lr": 5.5504717722901665e-06, "epoch": 10.368514150943396, "percentage": 51.84, "elapsed_time": "0:33:13", "remaining_time": "0:30:51", "throughput": 5747.85, "total_tokens": 11459216} {"current_steps": 17590, "total_steps": 33920, "loss": 0.5275, "lr": 5.547914624591597e-06, "epoch": 10.371462264150944, "percentage": 51.86, "elapsed_time": "0:33:14", "remaining_time": "0:30:51", "throughput": 5747.67, "total_tokens": 11462160} {"current_steps": 17595, "total_steps": 33920, "loss": 0.4625, "lr": 5.545357331830269e-06, "epoch": 10.37441037735849, "percentage": 51.87, "elapsed_time": "0:33:14", "remaining_time": "0:30:50", "throughput": 5747.68, "total_tokens": 11465488} {"current_steps": 17600, "total_steps": 33920, "loss": 0.3093, "lr": 5.542799894683235e-06, "epoch": 10.377358490566039, "percentage": 51.89, "elapsed_time": "0:33:15", "remaining_time": "0:30:50", "throughput": 5747.27, "total_tokens": 11467792} {"current_steps": 17605, "total_steps": 33920, "loss": 0.3896, "lr": 5.540242313827591e-06, "epoch": 10.380306603773585, "percentage": 51.9, "elapsed_time": "0:33:15", "remaining_time": "0:30:49", "throughput": 5747.25, "total_tokens": 11470896} {"current_steps": 17610, "total_steps": 33920, "loss": 0.3657, "lr": 5.537684589940466e-06, "epoch": 10.383254716981131, "percentage": 51.92, "elapsed_time": "0:33:16", "remaining_time": "0:30:49", "throughput": 5747.11, "total_tokens": 11473648} {"current_steps": 17615, "total_steps": 33920, "loss": 0.4337, "lr": 5.535126723699029e-06, "epoch": 10.38620283018868, "percentage": 51.93, "elapsed_time": "0:33:17", "remaining_time": "0:30:48", "throughput": 5747.12, "total_tokens": 11477136} {"current_steps": 17620, "total_steps": 33920, "loss": 0.3108, "lr": 5.532568715780485e-06, "epoch": 10.389150943396226, "percentage": 51.95, "elapsed_time": "0:33:17", "remaining_time": "0:30:47", "throughput": 5746.96, "total_tokens": 11480080} {"current_steps": 17625, "total_steps": 33920, "loss": 0.4411, "lr": 5.530010566862077e-06, "epoch": 10.392099056603774, "percentage": 51.96, "elapsed_time": "0:33:18", "remaining_time": "0:30:47", "throughput": 5746.76, "total_tokens": 11482992} {"current_steps": 17630, "total_steps": 33920, "loss": 0.3397, "lr": 5.527452277621089e-06, "epoch": 10.39504716981132, "percentage": 51.98, "elapsed_time": "0:33:18", "remaining_time": "0:30:46", "throughput": 5746.77, "total_tokens": 11486512} {"current_steps": 17635, "total_steps": 33920, "loss": 0.4316, "lr": 5.524893848734837e-06, "epoch": 10.397995283018869, "percentage": 51.99, "elapsed_time": "0:33:19", "remaining_time": "0:30:46", "throughput": 5746.84, "total_tokens": 11490448} {"current_steps": 17640, "total_steps": 33920, "loss": 0.4368, "lr": 5.522335280880676e-06, "epoch": 10.400943396226415, "percentage": 52.0, "elapsed_time": "0:33:19", "remaining_time": "0:30:45", "throughput": 5746.8, "total_tokens": 11493520} {"current_steps": 17645, "total_steps": 33920, "loss": 0.3717, "lr": 5.519776574735999e-06, "epoch": 10.403891509433961, "percentage": 52.02, "elapsed_time": "0:33:20", "remaining_time": "0:30:45", "throughput": 5746.88, "total_tokens": 11497232} {"current_steps": 17650, "total_steps": 33920, "loss": 0.3409, "lr": 5.5172177309782325e-06, "epoch": 10.40683962264151, "percentage": 52.03, "elapsed_time": "0:33:21", "remaining_time": "0:30:44", "throughput": 5746.96, "total_tokens": 11501072} {"current_steps": 17655, "total_steps": 33920, "loss": 0.4006, "lr": 5.514658750284844e-06, "epoch": 10.409787735849056, "percentage": 52.05, "elapsed_time": "0:33:21", "remaining_time": "0:30:44", "throughput": 5747.23, "total_tokens": 11504880} {"current_steps": 17660, "total_steps": 33920, "loss": 0.317, "lr": 5.512099633333332e-06, "epoch": 10.412735849056604, "percentage": 52.06, "elapsed_time": "0:33:22", "remaining_time": "0:30:43", "throughput": 5747.35, "total_tokens": 11508336} {"current_steps": 17665, "total_steps": 33920, "loss": 0.4241, "lr": 5.509540380801236e-06, "epoch": 10.41568396226415, "percentage": 52.08, "elapsed_time": "0:33:22", "remaining_time": "0:30:43", "throughput": 5747.2, "total_tokens": 11511344} {"current_steps": 17670, "total_steps": 33920, "loss": 0.3733, "lr": 5.506980993366129e-06, "epoch": 10.418632075471699, "percentage": 52.09, "elapsed_time": "0:33:23", "remaining_time": "0:30:42", "throughput": 5747.45, "total_tokens": 11515984} {"current_steps": 17675, "total_steps": 33920, "loss": 0.4111, "lr": 5.504421471705616e-06, "epoch": 10.421580188679245, "percentage": 52.11, "elapsed_time": "0:33:24", "remaining_time": "0:30:42", "throughput": 5747.28, "total_tokens": 11518992} {"current_steps": 17680, "total_steps": 33920, "loss": 0.4107, "lr": 5.501861816497346e-06, "epoch": 10.424528301886792, "percentage": 52.12, "elapsed_time": "0:33:24", "remaining_time": "0:30:41", "throughput": 5747.48, "total_tokens": 11523312} {"current_steps": 17685, "total_steps": 33920, "loss": 0.3727, "lr": 5.499302028418998e-06, "epoch": 10.42747641509434, "percentage": 52.14, "elapsed_time": "0:33:25", "remaining_time": "0:30:41", "throughput": 5747.54, "total_tokens": 11526960} {"current_steps": 17690, "total_steps": 33920, "loss": 0.4616, "lr": 5.496742108148285e-06, "epoch": 10.430424528301886, "percentage": 52.15, "elapsed_time": "0:33:26", "remaining_time": "0:30:40", "throughput": 5747.51, "total_tokens": 11530096} {"current_steps": 17695, "total_steps": 33920, "loss": 0.308, "lr": 5.494182056362959e-06, "epoch": 10.433372641509434, "percentage": 52.17, "elapsed_time": "0:33:26", "remaining_time": "0:30:39", "throughput": 5747.48, "total_tokens": 11533328} {"current_steps": 17700, "total_steps": 33920, "loss": 0.4698, "lr": 5.491621873740804e-06, "epoch": 10.43632075471698, "percentage": 52.18, "elapsed_time": "0:33:27", "remaining_time": "0:30:39", "throughput": 5747.36, "total_tokens": 11536336} {"current_steps": 17705, "total_steps": 33920, "loss": 0.5364, "lr": 5.4890615609596375e-06, "epoch": 10.439268867924529, "percentage": 52.2, "elapsed_time": "0:33:27", "remaining_time": "0:30:38", "throughput": 5747.1, "total_tokens": 11538928} {"current_steps": 17710, "total_steps": 33920, "loss": 0.3848, "lr": 5.486501118697317e-06, "epoch": 10.442216981132075, "percentage": 52.21, "elapsed_time": "0:33:28", "remaining_time": "0:30:38", "throughput": 5746.68, "total_tokens": 11541520} {"current_steps": 17715, "total_steps": 33920, "loss": 0.3601, "lr": 5.483940547631727e-06, "epoch": 10.445165094339623, "percentage": 52.23, "elapsed_time": "0:33:28", "remaining_time": "0:30:37", "throughput": 5746.74, "total_tokens": 11544976} {"current_steps": 17720, "total_steps": 33920, "loss": 0.5124, "lr": 5.481379848440792e-06, "epoch": 10.44811320754717, "percentage": 52.24, "elapsed_time": "0:33:29", "remaining_time": "0:30:37", "throughput": 5747.0, "total_tokens": 11549072} {"current_steps": 17725, "total_steps": 33920, "loss": 0.3794, "lr": 5.478819021802468e-06, "epoch": 10.451061320754716, "percentage": 52.26, "elapsed_time": "0:33:30", "remaining_time": "0:30:36", "throughput": 5746.9, "total_tokens": 11552080} {"current_steps": 17730, "total_steps": 33920, "loss": 0.2933, "lr": 5.476258068394743e-06, "epoch": 10.454009433962264, "percentage": 52.27, "elapsed_time": "0:33:30", "remaining_time": "0:30:36", "throughput": 5747.1, "total_tokens": 11555920} {"current_steps": 17735, "total_steps": 33920, "loss": 0.2379, "lr": 5.473696988895644e-06, "epoch": 10.45695754716981, "percentage": 52.28, "elapsed_time": "0:33:31", "remaining_time": "0:30:35", "throughput": 5747.31, "total_tokens": 11560112} {"current_steps": 17740, "total_steps": 33920, "loss": 0.3868, "lr": 5.471135783983224e-06, "epoch": 10.459905660377359, "percentage": 52.3, "elapsed_time": "0:33:31", "remaining_time": "0:30:35", "throughput": 5747.29, "total_tokens": 11563184} {"current_steps": 17745, "total_steps": 33920, "loss": 0.341, "lr": 5.4685744543355745e-06, "epoch": 10.462853773584905, "percentage": 52.31, "elapsed_time": "0:33:32", "remaining_time": "0:30:34", "throughput": 5747.1, "total_tokens": 11566384} {"current_steps": 17750, "total_steps": 33920, "loss": 0.3955, "lr": 5.466013000630819e-06, "epoch": 10.465801886792454, "percentage": 52.33, "elapsed_time": "0:33:33", "remaining_time": "0:30:33", "throughput": 5747.02, "total_tokens": 11569392} {"current_steps": 17755, "total_steps": 33920, "loss": 0.3669, "lr": 5.463451423547114e-06, "epoch": 10.46875, "percentage": 52.34, "elapsed_time": "0:33:33", "remaining_time": "0:30:33", "throughput": 5747.21, "total_tokens": 11573264} {"current_steps": 17760, "total_steps": 33920, "loss": 0.4188, "lr": 5.460889723762647e-06, "epoch": 10.471698113207546, "percentage": 52.36, "elapsed_time": "0:33:34", "remaining_time": "0:30:32", "throughput": 5747.33, "total_tokens": 11576816} {"current_steps": 17765, "total_steps": 33920, "loss": 0.3481, "lr": 5.458327901955639e-06, "epoch": 10.474646226415095, "percentage": 52.37, "elapsed_time": "0:33:34", "remaining_time": "0:30:32", "throughput": 5747.33, "total_tokens": 11580656} {"current_steps": 17770, "total_steps": 33920, "loss": 0.3316, "lr": 5.455765958804344e-06, "epoch": 10.477594339622641, "percentage": 52.39, "elapsed_time": "0:33:35", "remaining_time": "0:30:31", "throughput": 5747.15, "total_tokens": 11583504} {"current_steps": 17775, "total_steps": 33920, "loss": 0.3063, "lr": 5.4532038949870455e-06, "epoch": 10.48054245283019, "percentage": 52.4, "elapsed_time": "0:33:36", "remaining_time": "0:30:31", "throughput": 5747.19, "total_tokens": 11587056} {"current_steps": 17780, "total_steps": 33920, "loss": 0.4263, "lr": 5.450641711182066e-06, "epoch": 10.483490566037736, "percentage": 52.42, "elapsed_time": "0:33:36", "remaining_time": "0:30:30", "throughput": 5747.16, "total_tokens": 11590448} {"current_steps": 17785, "total_steps": 33920, "loss": 0.3105, "lr": 5.448079408067748e-06, "epoch": 10.486438679245284, "percentage": 52.43, "elapsed_time": "0:33:37", "remaining_time": "0:30:30", "throughput": 5746.96, "total_tokens": 11593200} {"current_steps": 17790, "total_steps": 33920, "loss": 0.3819, "lr": 5.4455169863224775e-06, "epoch": 10.48938679245283, "percentage": 52.45, "elapsed_time": "0:33:37", "remaining_time": "0:30:29", "throughput": 5747.05, "total_tokens": 11596880} {"current_steps": 17795, "total_steps": 33920, "loss": 0.4312, "lr": 5.442954446624664e-06, "epoch": 10.492334905660377, "percentage": 52.46, "elapsed_time": "0:33:38", "remaining_time": "0:30:29", "throughput": 5746.79, "total_tokens": 11599632} {"current_steps": 17800, "total_steps": 33920, "loss": 0.5003, "lr": 5.440391789652752e-06, "epoch": 10.495283018867925, "percentage": 52.48, "elapsed_time": "0:33:39", "remaining_time": "0:30:28", "throughput": 5746.56, "total_tokens": 11602416} {"current_steps": 17805, "total_steps": 33920, "loss": 0.271, "lr": 5.437829016085216e-06, "epoch": 10.498231132075471, "percentage": 52.49, "elapsed_time": "0:33:39", "remaining_time": "0:30:27", "throughput": 5746.3, "total_tokens": 11605008} {"current_steps": 17810, "total_steps": 33920, "loss": 0.3225, "lr": 5.435266126600561e-06, "epoch": 10.50117924528302, "percentage": 52.51, "elapsed_time": "0:33:40", "remaining_time": "0:30:27", "throughput": 5746.21, "total_tokens": 11607856} {"current_steps": 17815, "total_steps": 33920, "loss": 0.4079, "lr": 5.4327031218773215e-06, "epoch": 10.504127358490566, "percentage": 52.52, "elapsed_time": "0:33:40", "remaining_time": "0:30:26", "throughput": 5746.21, "total_tokens": 11611184} {"current_steps": 17820, "total_steps": 33920, "loss": 0.3475, "lr": 5.430140002594067e-06, "epoch": 10.507075471698114, "percentage": 52.54, "elapsed_time": "0:33:41", "remaining_time": "0:30:26", "throughput": 5746.36, "total_tokens": 11614704} {"current_steps": 17825, "total_steps": 33920, "loss": 0.378, "lr": 5.4275767694293934e-06, "epoch": 10.51002358490566, "percentage": 52.55, "elapsed_time": "0:33:41", "remaining_time": "0:30:25", "throughput": 5746.25, "total_tokens": 11617584} {"current_steps": 17830, "total_steps": 33920, "loss": 0.4474, "lr": 5.425013423061926e-06, "epoch": 10.512971698113208, "percentage": 52.56, "elapsed_time": "0:33:42", "remaining_time": "0:30:24", "throughput": 5746.11, "total_tokens": 11620464} {"current_steps": 17835, "total_steps": 33920, "loss": 0.2538, "lr": 5.422449964170324e-06, "epoch": 10.515919811320755, "percentage": 52.58, "elapsed_time": "0:33:42", "remaining_time": "0:30:24", "throughput": 5746.24, "total_tokens": 11623696} {"current_steps": 17840, "total_steps": 33920, "loss": 0.397, "lr": 5.419886393433275e-06, "epoch": 10.518867924528301, "percentage": 52.59, "elapsed_time": "0:33:43", "remaining_time": "0:30:23", "throughput": 5746.3, "total_tokens": 11626928} {"current_steps": 17845, "total_steps": 33920, "loss": 0.3661, "lr": 5.417322711529491e-06, "epoch": 10.52181603773585, "percentage": 52.61, "elapsed_time": "0:33:43", "remaining_time": "0:30:23", "throughput": 5746.24, "total_tokens": 11629808} {"current_steps": 17850, "total_steps": 33920, "loss": 0.3338, "lr": 5.4147589191377224e-06, "epoch": 10.524764150943396, "percentage": 52.62, "elapsed_time": "0:33:44", "remaining_time": "0:30:22", "throughput": 5746.39, "total_tokens": 11633584} {"current_steps": 17855, "total_steps": 33920, "loss": 0.5934, "lr": 5.412195016936742e-06, "epoch": 10.527712264150944, "percentage": 52.64, "elapsed_time": "0:33:45", "remaining_time": "0:30:22", "throughput": 5746.45, "total_tokens": 11636816} {"current_steps": 17860, "total_steps": 33920, "loss": 0.4128, "lr": 5.409631005605354e-06, "epoch": 10.53066037735849, "percentage": 52.65, "elapsed_time": "0:33:45", "remaining_time": "0:30:21", "throughput": 5746.51, "total_tokens": 11640048} {"current_steps": 17865, "total_steps": 33920, "loss": 0.2739, "lr": 5.407066885822391e-06, "epoch": 10.533608490566039, "percentage": 52.67, "elapsed_time": "0:33:46", "remaining_time": "0:30:20", "throughput": 5746.41, "total_tokens": 11643184} {"current_steps": 17870, "total_steps": 33920, "loss": 0.3957, "lr": 5.404502658266717e-06, "epoch": 10.536556603773585, "percentage": 52.68, "elapsed_time": "0:33:46", "remaining_time": "0:30:20", "throughput": 5746.38, "total_tokens": 11646608} {"current_steps": 17875, "total_steps": 33920, "loss": 0.4263, "lr": 5.4019383236172195e-06, "epoch": 10.539504716981131, "percentage": 52.7, "elapsed_time": "0:33:47", "remaining_time": "0:30:20", "throughput": 5746.57, "total_tokens": 11652528} {"current_steps": 17880, "total_steps": 33920, "loss": 0.4047, "lr": 5.39937388255282e-06, "epoch": 10.54245283018868, "percentage": 52.71, "elapsed_time": "0:33:48", "remaining_time": "0:30:19", "throughput": 5746.61, "total_tokens": 11656016} {"current_steps": 17885, "total_steps": 33920, "loss": 0.3189, "lr": 5.3968093357524645e-06, "epoch": 10.545400943396226, "percentage": 52.73, "elapsed_time": "0:33:48", "remaining_time": "0:30:19", "throughput": 5746.62, "total_tokens": 11659152} {"current_steps": 17890, "total_steps": 33920, "loss": 0.3136, "lr": 5.3942446838951245e-06, "epoch": 10.548349056603774, "percentage": 52.74, "elapsed_time": "0:33:49", "remaining_time": "0:30:18", "throughput": 5746.67, "total_tokens": 11662416} {"current_steps": 17895, "total_steps": 33920, "loss": 0.4149, "lr": 5.3916799276598074e-06, "epoch": 10.55129716981132, "percentage": 52.76, "elapsed_time": "0:33:50", "remaining_time": "0:30:17", "throughput": 5746.79, "total_tokens": 11666288} {"current_steps": 17900, "total_steps": 33920, "loss": 0.3559, "lr": 5.3891150677255425e-06, "epoch": 10.554245283018869, "percentage": 52.77, "elapsed_time": "0:33:50", "remaining_time": "0:30:17", "throughput": 5746.78, "total_tokens": 11669648} {"current_steps": 17905, "total_steps": 33920, "loss": 0.4641, "lr": 5.386550104771384e-06, "epoch": 10.557193396226415, "percentage": 52.79, "elapsed_time": "0:33:51", "remaining_time": "0:30:16", "throughput": 5747.08, "total_tokens": 11673808} {"current_steps": 17910, "total_steps": 33920, "loss": 0.3883, "lr": 5.3839850394764205e-06, "epoch": 10.560141509433961, "percentage": 52.8, "elapsed_time": "0:33:51", "remaining_time": "0:30:16", "throughput": 5747.06, "total_tokens": 11677136} {"current_steps": 17915, "total_steps": 33920, "loss": 0.307, "lr": 5.381419872519763e-06, "epoch": 10.56308962264151, "percentage": 52.82, "elapsed_time": "0:33:52", "remaining_time": "0:30:15", "throughput": 5747.0, "total_tokens": 11679984} {"current_steps": 17920, "total_steps": 33920, "loss": 0.273, "lr": 5.378854604580549e-06, "epoch": 10.566037735849056, "percentage": 52.83, "elapsed_time": "0:33:52", "remaining_time": "0:30:15", "throughput": 5746.92, "total_tokens": 11682992} {"current_steps": 17925, "total_steps": 33920, "loss": 0.3645, "lr": 5.376289236337946e-06, "epoch": 10.568985849056604, "percentage": 52.84, "elapsed_time": "0:33:53", "remaining_time": "0:30:14", "throughput": 5747.09, "total_tokens": 11687024} {"current_steps": 17930, "total_steps": 33920, "loss": 0.3354, "lr": 5.373723768471147e-06, "epoch": 10.57193396226415, "percentage": 52.86, "elapsed_time": "0:33:54", "remaining_time": "0:30:14", "throughput": 5747.05, "total_tokens": 11690160} {"current_steps": 17935, "total_steps": 33920, "loss": 0.3308, "lr": 5.37115820165937e-06, "epoch": 10.574882075471699, "percentage": 52.87, "elapsed_time": "0:33:54", "remaining_time": "0:30:13", "throughput": 5747.25, "total_tokens": 11694256} {"current_steps": 17940, "total_steps": 33920, "loss": 0.2975, "lr": 5.368592536581858e-06, "epoch": 10.577830188679245, "percentage": 52.89, "elapsed_time": "0:33:55", "remaining_time": "0:30:12", "throughput": 5747.36, "total_tokens": 11697808} {"current_steps": 17945, "total_steps": 33920, "loss": 0.337, "lr": 5.366026773917885e-06, "epoch": 10.580778301886792, "percentage": 52.9, "elapsed_time": "0:33:56", "remaining_time": "0:30:12", "throughput": 5747.49, "total_tokens": 11701904} {"current_steps": 17950, "total_steps": 33920, "loss": 0.325, "lr": 5.363460914346746e-06, "epoch": 10.58372641509434, "percentage": 52.92, "elapsed_time": "0:33:56", "remaining_time": "0:30:11", "throughput": 5747.23, "total_tokens": 11704464} {"current_steps": 17955, "total_steps": 33920, "loss": 0.3533, "lr": 5.360894958547762e-06, "epoch": 10.586674528301886, "percentage": 52.93, "elapsed_time": "0:33:57", "remaining_time": "0:30:11", "throughput": 5747.09, "total_tokens": 11707408} {"current_steps": 17960, "total_steps": 33920, "loss": 0.3972, "lr": 5.358328907200284e-06, "epoch": 10.589622641509434, "percentage": 52.95, "elapsed_time": "0:33:57", "remaining_time": "0:30:10", "throughput": 5746.97, "total_tokens": 11710544} {"current_steps": 17965, "total_steps": 33920, "loss": 0.2769, "lr": 5.355762760983682e-06, "epoch": 10.59257075471698, "percentage": 52.96, "elapsed_time": "0:33:58", "remaining_time": "0:30:10", "throughput": 5747.18, "total_tokens": 11714768} {"current_steps": 17970, "total_steps": 33920, "loss": 0.4167, "lr": 5.353196520577356e-06, "epoch": 10.595518867924529, "percentage": 52.98, "elapsed_time": "0:33:58", "remaining_time": "0:30:09", "throughput": 5747.34, "total_tokens": 11718256} {"current_steps": 17975, "total_steps": 33920, "loss": 0.4275, "lr": 5.35063018666073e-06, "epoch": 10.598466981132075, "percentage": 52.99, "elapsed_time": "0:33:59", "remaining_time": "0:30:09", "throughput": 5747.17, "total_tokens": 11721040} {"current_steps": 17980, "total_steps": 33920, "loss": 0.4001, "lr": 5.3480637599132515e-06, "epoch": 10.601415094339622, "percentage": 53.01, "elapsed_time": "0:34:00", "remaining_time": "0:30:08", "throughput": 5747.21, "total_tokens": 11724592} {"current_steps": 17985, "total_steps": 33920, "loss": 0.3692, "lr": 5.34549724101439e-06, "epoch": 10.60436320754717, "percentage": 53.02, "elapsed_time": "0:34:00", "remaining_time": "0:30:08", "throughput": 5747.5, "total_tokens": 11729200} {"current_steps": 17990, "total_steps": 33920, "loss": 0.4728, "lr": 5.342930630643646e-06, "epoch": 10.607311320754716, "percentage": 53.04, "elapsed_time": "0:34:01", "remaining_time": "0:30:07", "throughput": 5747.39, "total_tokens": 11732368} {"current_steps": 17995, "total_steps": 33920, "loss": 0.3403, "lr": 5.340363929480541e-06, "epoch": 10.610259433962264, "percentage": 53.05, "elapsed_time": "0:34:01", "remaining_time": "0:30:07", "throughput": 5747.39, "total_tokens": 11735856} {"current_steps": 18000, "total_steps": 33920, "loss": 0.4121, "lr": 5.3377971382046164e-06, "epoch": 10.61320754716981, "percentage": 53.07, "elapsed_time": "0:34:02", "remaining_time": "0:30:06", "throughput": 5747.49, "total_tokens": 11739184} {"current_steps": 18005, "total_steps": 33920, "loss": 0.4749, "lr": 5.335230257495446e-06, "epoch": 10.616155660377359, "percentage": 53.08, "elapsed_time": "0:34:02", "remaining_time": "0:30:05", "throughput": 5747.32, "total_tokens": 11741680} {"current_steps": 18010, "total_steps": 33920, "loss": 0.3491, "lr": 5.3326632880326205e-06, "epoch": 10.619103773584905, "percentage": 53.1, "elapsed_time": "0:34:03", "remaining_time": "0:30:05", "throughput": 5747.5, "total_tokens": 11745616} {"current_steps": 18015, "total_steps": 33920, "loss": 0.3061, "lr": 5.3300962304957515e-06, "epoch": 10.622051886792454, "percentage": 53.11, "elapsed_time": "0:34:04", "remaining_time": "0:30:04", "throughput": 5747.4, "total_tokens": 11748528} {"current_steps": 18020, "total_steps": 33920, "loss": 0.4662, "lr": 5.327529085564487e-06, "epoch": 10.625, "percentage": 53.12, "elapsed_time": "0:34:04", "remaining_time": "0:30:04", "throughput": 5747.21, "total_tokens": 11751056} {"current_steps": 18025, "total_steps": 33920, "loss": 0.3393, "lr": 5.324961853918485e-06, "epoch": 10.627948113207546, "percentage": 53.14, "elapsed_time": "0:34:05", "remaining_time": "0:30:03", "throughput": 5747.35, "total_tokens": 11754864} {"current_steps": 18030, "total_steps": 33920, "loss": 0.371, "lr": 5.32239453623743e-06, "epoch": 10.630896226415095, "percentage": 53.15, "elapsed_time": "0:34:05", "remaining_time": "0:30:03", "throughput": 5747.33, "total_tokens": 11758256} {"current_steps": 18035, "total_steps": 33920, "loss": 0.3751, "lr": 5.3198271332010335e-06, "epoch": 10.633844339622641, "percentage": 53.17, "elapsed_time": "0:34:06", "remaining_time": "0:30:02", "throughput": 5747.57, "total_tokens": 11762096} {"current_steps": 18040, "total_steps": 33920, "loss": 0.3324, "lr": 5.317259645489024e-06, "epoch": 10.63679245283019, "percentage": 53.18, "elapsed_time": "0:34:07", "remaining_time": "0:30:01", "throughput": 5747.8, "total_tokens": 11765872} {"current_steps": 18045, "total_steps": 33920, "loss": 0.2893, "lr": 5.314692073781157e-06, "epoch": 10.639740566037736, "percentage": 53.2, "elapsed_time": "0:34:07", "remaining_time": "0:30:01", "throughput": 5747.72, "total_tokens": 11768528} {"current_steps": 18050, "total_steps": 33920, "loss": 0.3557, "lr": 5.312124418757207e-06, "epoch": 10.642688679245284, "percentage": 53.21, "elapsed_time": "0:34:08", "remaining_time": "0:30:00", "throughput": 5747.91, "total_tokens": 11772208} {"current_steps": 18055, "total_steps": 33920, "loss": 0.5397, "lr": 5.309556681096972e-06, "epoch": 10.64563679245283, "percentage": 53.23, "elapsed_time": "0:34:08", "remaining_time": "0:30:00", "throughput": 5748.19, "total_tokens": 11776528} {"current_steps": 18060, "total_steps": 33920, "loss": 0.3975, "lr": 5.306988861480271e-06, "epoch": 10.648584905660378, "percentage": 53.24, "elapsed_time": "0:34:09", "remaining_time": "0:29:59", "throughput": 5748.41, "total_tokens": 11780176} {"current_steps": 18065, "total_steps": 33920, "loss": 0.3357, "lr": 5.304420960586946e-06, "epoch": 10.651533018867925, "percentage": 53.26, "elapsed_time": "0:34:09", "remaining_time": "0:29:59", "throughput": 5748.34, "total_tokens": 11783216} {"current_steps": 18070, "total_steps": 33920, "loss": 0.3338, "lr": 5.3018529790968606e-06, "epoch": 10.654481132075471, "percentage": 53.27, "elapsed_time": "0:34:10", "remaining_time": "0:29:58", "throughput": 5748.89, "total_tokens": 11789904} {"current_steps": 18075, "total_steps": 33920, "loss": 0.4727, "lr": 5.299284917689898e-06, "epoch": 10.65742924528302, "percentage": 53.29, "elapsed_time": "0:34:11", "remaining_time": "0:29:58", "throughput": 5748.87, "total_tokens": 11793040} {"current_steps": 18080, "total_steps": 33920, "loss": 0.3884, "lr": 5.296716777045962e-06, "epoch": 10.660377358490566, "percentage": 53.3, "elapsed_time": "0:34:11", "remaining_time": "0:29:57", "throughput": 5748.85, "total_tokens": 11796336} {"current_steps": 18085, "total_steps": 33920, "loss": 0.3869, "lr": 5.294148557844983e-06, "epoch": 10.663325471698114, "percentage": 53.32, "elapsed_time": "0:34:12", "remaining_time": "0:29:57", "throughput": 5748.82, "total_tokens": 11799568} {"current_steps": 18090, "total_steps": 33920, "loss": 0.3317, "lr": 5.291580260766904e-06, "epoch": 10.66627358490566, "percentage": 53.33, "elapsed_time": "0:34:13", "remaining_time": "0:29:56", "throughput": 5748.9, "total_tokens": 11802960} {"current_steps": 18095, "total_steps": 33920, "loss": 0.3257, "lr": 5.289011886491694e-06, "epoch": 10.669221698113208, "percentage": 53.35, "elapsed_time": "0:34:13", "remaining_time": "0:29:56", "throughput": 5749.15, "total_tokens": 11807088} {"current_steps": 18100, "total_steps": 33920, "loss": 0.3056, "lr": 5.286443435699342e-06, "epoch": 10.672169811320755, "percentage": 53.36, "elapsed_time": "0:34:14", "remaining_time": "0:29:55", "throughput": 5749.26, "total_tokens": 11811920} {"current_steps": 18105, "total_steps": 33920, "loss": 0.407, "lr": 5.283874909069855e-06, "epoch": 10.675117924528301, "percentage": 53.38, "elapsed_time": "0:34:15", "remaining_time": "0:29:55", "throughput": 5749.29, "total_tokens": 11814800} {"current_steps": 18110, "total_steps": 33920, "loss": 0.445, "lr": 5.281306307283263e-06, "epoch": 10.67806603773585, "percentage": 53.39, "elapsed_time": "0:34:15", "remaining_time": "0:29:54", "throughput": 5749.17, "total_tokens": 11818224} {"current_steps": 18115, "total_steps": 33920, "loss": 0.3669, "lr": 5.2787376310196145e-06, "epoch": 10.681014150943396, "percentage": 53.41, "elapsed_time": "0:34:16", "remaining_time": "0:29:53", "throughput": 5749.15, "total_tokens": 11821424} {"current_steps": 18120, "total_steps": 33920, "loss": 0.355, "lr": 5.276168880958977e-06, "epoch": 10.683962264150944, "percentage": 53.42, "elapsed_time": "0:34:16", "remaining_time": "0:29:53", "throughput": 5748.91, "total_tokens": 11823888} {"current_steps": 18125, "total_steps": 33920, "loss": 0.3494, "lr": 5.273600057781437e-06, "epoch": 10.68691037735849, "percentage": 53.43, "elapsed_time": "0:34:17", "remaining_time": "0:29:52", "throughput": 5748.77, "total_tokens": 11826896} {"current_steps": 18130, "total_steps": 33920, "loss": 0.362, "lr": 5.271031162167103e-06, "epoch": 10.689858490566039, "percentage": 53.45, "elapsed_time": "0:34:17", "remaining_time": "0:29:52", "throughput": 5748.82, "total_tokens": 11830224} {"current_steps": 18135, "total_steps": 33920, "loss": 0.3199, "lr": 5.268462194796101e-06, "epoch": 10.692806603773585, "percentage": 53.46, "elapsed_time": "0:34:18", "remaining_time": "0:29:51", "throughput": 5748.94, "total_tokens": 11833456} {"current_steps": 18140, "total_steps": 33920, "loss": 0.4827, "lr": 5.265893156348576e-06, "epoch": 10.695754716981131, "percentage": 53.48, "elapsed_time": "0:34:18", "remaining_time": "0:29:51", "throughput": 5748.94, "total_tokens": 11836848} {"current_steps": 18145, "total_steps": 33920, "loss": 0.4115, "lr": 5.2633240475046925e-06, "epoch": 10.69870283018868, "percentage": 53.49, "elapsed_time": "0:34:19", "remaining_time": "0:29:50", "throughput": 5748.7, "total_tokens": 11839504} {"current_steps": 18150, "total_steps": 33920, "loss": 0.4453, "lr": 5.2607548689446305e-06, "epoch": 10.701650943396226, "percentage": 53.51, "elapsed_time": "0:34:20", "remaining_time": "0:29:49", "throughput": 5748.71, "total_tokens": 11842640} {"current_steps": 18155, "total_steps": 33920, "loss": 0.3442, "lr": 5.258185621348595e-06, "epoch": 10.704599056603774, "percentage": 53.52, "elapsed_time": "0:34:20", "remaining_time": "0:29:49", "throughput": 5748.3, "total_tokens": 11844592} {"current_steps": 18160, "total_steps": 33920, "loss": 0.5397, "lr": 5.255616305396801e-06, "epoch": 10.70754716981132, "percentage": 53.54, "elapsed_time": "0:34:21", "remaining_time": "0:29:48", "throughput": 5748.34, "total_tokens": 11847696} {"current_steps": 18165, "total_steps": 33920, "loss": 0.3407, "lr": 5.253046921769491e-06, "epoch": 10.710495283018869, "percentage": 53.55, "elapsed_time": "0:34:21", "remaining_time": "0:29:48", "throughput": 5748.37, "total_tokens": 11850672} {"current_steps": 18170, "total_steps": 33920, "loss": 0.3258, "lr": 5.250477471146916e-06, "epoch": 10.713443396226415, "percentage": 53.57, "elapsed_time": "0:34:22", "remaining_time": "0:29:47", "throughput": 5748.57, "total_tokens": 11854480} {"current_steps": 18175, "total_steps": 33920, "loss": 0.2342, "lr": 5.2479079542093535e-06, "epoch": 10.716391509433961, "percentage": 53.58, "elapsed_time": "0:34:22", "remaining_time": "0:29:46", "throughput": 5748.76, "total_tokens": 11858032} {"current_steps": 18180, "total_steps": 33920, "loss": 0.3329, "lr": 5.245338371637091e-06, "epoch": 10.71933962264151, "percentage": 53.6, "elapsed_time": "0:34:23", "remaining_time": "0:29:46", "throughput": 5748.75, "total_tokens": 11861296} {"current_steps": 18185, "total_steps": 33920, "loss": 0.4341, "lr": 5.242768724110437e-06, "epoch": 10.722287735849056, "percentage": 53.61, "elapsed_time": "0:34:23", "remaining_time": "0:29:45", "throughput": 5748.38, "total_tokens": 11863344} {"current_steps": 18190, "total_steps": 33920, "loss": 0.3417, "lr": 5.240199012309717e-06, "epoch": 10.725235849056604, "percentage": 53.63, "elapsed_time": "0:34:24", "remaining_time": "0:29:45", "throughput": 5748.37, "total_tokens": 11866704} {"current_steps": 18195, "total_steps": 33920, "loss": 0.3639, "lr": 5.237629236915273e-06, "epoch": 10.72818396226415, "percentage": 53.64, "elapsed_time": "0:34:24", "remaining_time": "0:29:44", "throughput": 5748.29, "total_tokens": 11869648} {"current_steps": 18200, "total_steps": 33920, "loss": 0.4036, "lr": 5.235059398607464e-06, "epoch": 10.731132075471699, "percentage": 53.66, "elapsed_time": "0:34:25", "remaining_time": "0:29:44", "throughput": 5748.4, "total_tokens": 11873040} {"current_steps": 18205, "total_steps": 33920, "loss": 0.328, "lr": 5.232489498066665e-06, "epoch": 10.734080188679245, "percentage": 53.67, "elapsed_time": "0:34:25", "remaining_time": "0:29:43", "throughput": 5748.44, "total_tokens": 11876176} {"current_steps": 18210, "total_steps": 33920, "loss": 0.4602, "lr": 5.229919535973272e-06, "epoch": 10.737028301886792, "percentage": 53.69, "elapsed_time": "0:34:26", "remaining_time": "0:29:42", "throughput": 5748.38, "total_tokens": 11878864} {"current_steps": 18215, "total_steps": 33920, "loss": 0.3387, "lr": 5.2273495130076905e-06, "epoch": 10.73997641509434, "percentage": 53.7, "elapsed_time": "0:34:27", "remaining_time": "0:29:42", "throughput": 5748.43, "total_tokens": 11882192} {"current_steps": 18220, "total_steps": 33920, "loss": 0.3297, "lr": 5.224779429850344e-06, "epoch": 10.742924528301886, "percentage": 53.71, "elapsed_time": "0:34:27", "remaining_time": "0:29:41", "throughput": 5748.17, "total_tokens": 11885040} {"current_steps": 18225, "total_steps": 33920, "loss": 0.3419, "lr": 5.222209287181677e-06, "epoch": 10.745872641509434, "percentage": 53.73, "elapsed_time": "0:34:28", "remaining_time": "0:29:41", "throughput": 5748.07, "total_tokens": 11888112} {"current_steps": 18230, "total_steps": 33920, "loss": 0.2961, "lr": 5.219639085682142e-06, "epoch": 10.74882075471698, "percentage": 53.74, "elapsed_time": "0:34:28", "remaining_time": "0:29:40", "throughput": 5748.15, "total_tokens": 11891440} {"current_steps": 18235, "total_steps": 33920, "loss": 0.3792, "lr": 5.2170688260322124e-06, "epoch": 10.751768867924529, "percentage": 53.76, "elapsed_time": "0:34:29", "remaining_time": "0:29:39", "throughput": 5748.01, "total_tokens": 11894224} {"current_steps": 18240, "total_steps": 33920, "loss": 0.4167, "lr": 5.214498508912376e-06, "epoch": 10.754716981132075, "percentage": 53.77, "elapsed_time": "0:34:29", "remaining_time": "0:29:39", "throughput": 5748.26, "total_tokens": 11898384} {"current_steps": 18245, "total_steps": 33920, "loss": 0.293, "lr": 5.211928135003135e-06, "epoch": 10.757665094339622, "percentage": 53.79, "elapsed_time": "0:34:30", "remaining_time": "0:29:38", "throughput": 5748.25, "total_tokens": 11901296} {"current_steps": 18250, "total_steps": 33920, "loss": 0.4455, "lr": 5.209357704985007e-06, "epoch": 10.76061320754717, "percentage": 53.8, "elapsed_time": "0:34:30", "remaining_time": "0:29:38", "throughput": 5748.29, "total_tokens": 11904336} {"current_steps": 18255, "total_steps": 33920, "loss": 0.3935, "lr": 5.206787219538524e-06, "epoch": 10.763561320754716, "percentage": 53.82, "elapsed_time": "0:34:31", "remaining_time": "0:29:37", "throughput": 5748.41, "total_tokens": 11907760} {"current_steps": 18260, "total_steps": 33920, "loss": 0.385, "lr": 5.204216679344234e-06, "epoch": 10.766509433962264, "percentage": 53.83, "elapsed_time": "0:34:32", "remaining_time": "0:29:36", "throughput": 5748.28, "total_tokens": 11910544} {"current_steps": 18265, "total_steps": 33920, "loss": 0.3224, "lr": 5.201646085082696e-06, "epoch": 10.76945754716981, "percentage": 53.85, "elapsed_time": "0:34:32", "remaining_time": "0:29:36", "throughput": 5748.07, "total_tokens": 11913200} {"current_steps": 18270, "total_steps": 33920, "loss": 0.3407, "lr": 5.199075437434491e-06, "epoch": 10.772405660377359, "percentage": 53.86, "elapsed_time": "0:34:33", "remaining_time": "0:29:35", "throughput": 5747.98, "total_tokens": 11915856} {"current_steps": 18275, "total_steps": 33920, "loss": 0.4124, "lr": 5.1965047370802046e-06, "epoch": 10.775353773584905, "percentage": 53.88, "elapsed_time": "0:34:33", "remaining_time": "0:29:35", "throughput": 5748.02, "total_tokens": 11919280} {"current_steps": 18280, "total_steps": 33920, "loss": 0.4124, "lr": 5.193933984700441e-06, "epoch": 10.778301886792454, "percentage": 53.89, "elapsed_time": "0:34:34", "remaining_time": "0:29:34", "throughput": 5747.98, "total_tokens": 11922192} {"current_steps": 18285, "total_steps": 33920, "loss": 0.3011, "lr": 5.1913631809758216e-06, "epoch": 10.78125, "percentage": 53.91, "elapsed_time": "0:34:34", "remaining_time": "0:29:34", "throughput": 5748.1, "total_tokens": 11925584} {"current_steps": 18290, "total_steps": 33920, "loss": 0.4597, "lr": 5.188792326586973e-06, "epoch": 10.784198113207546, "percentage": 53.92, "elapsed_time": "0:34:35", "remaining_time": "0:29:33", "throughput": 5748.19, "total_tokens": 11928720} {"current_steps": 18295, "total_steps": 33920, "loss": 0.3354, "lr": 5.186221422214544e-06, "epoch": 10.787146226415095, "percentage": 53.94, "elapsed_time": "0:34:35", "remaining_time": "0:29:32", "throughput": 5748.44, "total_tokens": 11933232} {"current_steps": 18300, "total_steps": 33920, "loss": 0.3631, "lr": 5.1836504685391885e-06, "epoch": 10.790094339622641, "percentage": 53.95, "elapsed_time": "0:34:36", "remaining_time": "0:29:32", "throughput": 5748.46, "total_tokens": 11936208} {"current_steps": 18305, "total_steps": 33920, "loss": 0.3286, "lr": 5.181079466241582e-06, "epoch": 10.79304245283019, "percentage": 53.97, "elapsed_time": "0:34:36", "remaining_time": "0:29:31", "throughput": 5748.44, "total_tokens": 11939504} {"current_steps": 18310, "total_steps": 33920, "loss": 0.4243, "lr": 5.178508416002406e-06, "epoch": 10.795990566037736, "percentage": 53.98, "elapsed_time": "0:34:37", "remaining_time": "0:29:31", "throughput": 5748.22, "total_tokens": 11941872} {"current_steps": 18315, "total_steps": 33920, "loss": 0.2514, "lr": 5.175937318502357e-06, "epoch": 10.798938679245284, "percentage": 53.99, "elapsed_time": "0:34:38", "remaining_time": "0:29:31", "throughput": 5748.72, "total_tokens": 11949072} {"current_steps": 18320, "total_steps": 33920, "loss": 0.3245, "lr": 5.173366174422147e-06, "epoch": 10.80188679245283, "percentage": 54.01, "elapsed_time": "0:34:39", "remaining_time": "0:29:30", "throughput": 5748.7, "total_tokens": 11952144} {"current_steps": 18325, "total_steps": 33920, "loss": 0.6438, "lr": 5.170794984442492e-06, "epoch": 10.804834905660378, "percentage": 54.02, "elapsed_time": "0:34:39", "remaining_time": "0:29:29", "throughput": 5748.47, "total_tokens": 11954640} {"current_steps": 18330, "total_steps": 33920, "loss": 0.2986, "lr": 5.16822374924413e-06, "epoch": 10.807783018867925, "percentage": 54.04, "elapsed_time": "0:34:40", "remaining_time": "0:29:29", "throughput": 5748.52, "total_tokens": 11957968} {"current_steps": 18335, "total_steps": 33920, "loss": 0.4318, "lr": 5.165652469507806e-06, "epoch": 10.810731132075471, "percentage": 54.05, "elapsed_time": "0:34:40", "remaining_time": "0:29:28", "throughput": 5748.45, "total_tokens": 11960944} {"current_steps": 18340, "total_steps": 33920, "loss": 0.3977, "lr": 5.163081145914276e-06, "epoch": 10.81367924528302, "percentage": 54.07, "elapsed_time": "0:34:41", "remaining_time": "0:29:28", "throughput": 5748.57, "total_tokens": 11964496} {"current_steps": 18345, "total_steps": 33920, "loss": 0.3632, "lr": 5.160509779144311e-06, "epoch": 10.816627358490566, "percentage": 54.08, "elapsed_time": "0:34:41", "remaining_time": "0:29:27", "throughput": 5748.49, "total_tokens": 11967152} {"current_steps": 18350, "total_steps": 33920, "loss": 0.394, "lr": 5.157938369878688e-06, "epoch": 10.819575471698114, "percentage": 54.1, "elapsed_time": "0:34:42", "remaining_time": "0:29:26", "throughput": 5748.33, "total_tokens": 11969744} {"current_steps": 18355, "total_steps": 33920, "loss": 0.2809, "lr": 5.155366918798203e-06, "epoch": 10.82252358490566, "percentage": 54.11, "elapsed_time": "0:34:42", "remaining_time": "0:29:26", "throughput": 5748.26, "total_tokens": 11972400} {"current_steps": 18360, "total_steps": 33920, "loss": 0.3309, "lr": 5.152795426583654e-06, "epoch": 10.825471698113208, "percentage": 54.13, "elapsed_time": "0:34:43", "remaining_time": "0:29:25", "throughput": 5748.15, "total_tokens": 11974992} {"current_steps": 18365, "total_steps": 33920, "loss": 0.3745, "lr": 5.15022389391586e-06, "epoch": 10.828419811320755, "percentage": 54.14, "elapsed_time": "0:34:43", "remaining_time": "0:29:24", "throughput": 5748.13, "total_tokens": 11978096} {"current_steps": 18370, "total_steps": 33920, "loss": 0.5072, "lr": 5.147652321475642e-06, "epoch": 10.831367924528301, "percentage": 54.16, "elapsed_time": "0:34:44", "remaining_time": "0:29:24", "throughput": 5748.06, "total_tokens": 11981008} {"current_steps": 18375, "total_steps": 33920, "loss": 0.3936, "lr": 5.145080709943835e-06, "epoch": 10.83431603773585, "percentage": 54.17, "elapsed_time": "0:34:44", "remaining_time": "0:29:23", "throughput": 5748.01, "total_tokens": 11984336} {"current_steps": 18380, "total_steps": 33920, "loss": 0.3093, "lr": 5.142509060001285e-06, "epoch": 10.837264150943396, "percentage": 54.19, "elapsed_time": "0:34:45", "remaining_time": "0:29:23", "throughput": 5747.74, "total_tokens": 11986736} {"current_steps": 18385, "total_steps": 33920, "loss": 0.4739, "lr": 5.139937372328847e-06, "epoch": 10.840212264150944, "percentage": 54.2, "elapsed_time": "0:34:46", "remaining_time": "0:29:22", "throughput": 5747.94, "total_tokens": 11990608} {"current_steps": 18390, "total_steps": 33920, "loss": 0.3725, "lr": 5.1373656476073876e-06, "epoch": 10.84316037735849, "percentage": 54.22, "elapsed_time": "0:34:46", "remaining_time": "0:29:22", "throughput": 5747.94, "total_tokens": 11993552} {"current_steps": 18395, "total_steps": 33920, "loss": 0.3775, "lr": 5.134793886517779e-06, "epoch": 10.846108490566039, "percentage": 54.23, "elapsed_time": "0:34:47", "remaining_time": "0:29:21", "throughput": 5747.6, "total_tokens": 11995952} {"current_steps": 18400, "total_steps": 33920, "loss": 0.3981, "lr": 5.1322220897409105e-06, "epoch": 10.849056603773585, "percentage": 54.25, "elapsed_time": "0:34:47", "remaining_time": "0:29:20", "throughput": 5747.64, "total_tokens": 11999376} {"current_steps": 18405, "total_steps": 33920, "loss": 0.4274, "lr": 5.129650257957671e-06, "epoch": 10.852004716981131, "percentage": 54.26, "elapsed_time": "0:34:48", "remaining_time": "0:29:20", "throughput": 5747.88, "total_tokens": 12003312} {"current_steps": 18410, "total_steps": 33920, "loss": 0.4039, "lr": 5.12707839184897e-06, "epoch": 10.85495283018868, "percentage": 54.27, "elapsed_time": "0:34:48", "remaining_time": "0:29:19", "throughput": 5747.7, "total_tokens": 12006416} {"current_steps": 18415, "total_steps": 33920, "loss": 0.3129, "lr": 5.124506492095716e-06, "epoch": 10.857900943396226, "percentage": 54.29, "elapsed_time": "0:34:49", "remaining_time": "0:29:19", "throughput": 5747.79, "total_tokens": 12010160} {"current_steps": 18420, "total_steps": 33920, "loss": 0.3494, "lr": 5.121934559378831e-06, "epoch": 10.860849056603774, "percentage": 54.3, "elapsed_time": "0:34:50", "remaining_time": "0:29:18", "throughput": 5747.97, "total_tokens": 12014256} {"current_steps": 18425, "total_steps": 33920, "loss": 0.426, "lr": 5.1193625943792456e-06, "epoch": 10.86379716981132, "percentage": 54.32, "elapsed_time": "0:34:50", "remaining_time": "0:29:18", "throughput": 5747.97, "total_tokens": 12017456} {"current_steps": 18430, "total_steps": 33920, "loss": 0.3499, "lr": 5.116790597777901e-06, "epoch": 10.866745283018869, "percentage": 54.33, "elapsed_time": "0:34:51", "remaining_time": "0:29:17", "throughput": 5747.92, "total_tokens": 12020720} {"current_steps": 18435, "total_steps": 33920, "loss": 0.2392, "lr": 5.11421857025574e-06, "epoch": 10.869693396226415, "percentage": 54.35, "elapsed_time": "0:34:51", "remaining_time": "0:29:17", "throughput": 5748.06, "total_tokens": 12024080} {"current_steps": 18440, "total_steps": 33920, "loss": 0.3892, "lr": 5.111646512493721e-06, "epoch": 10.872641509433961, "percentage": 54.36, "elapsed_time": "0:34:52", "remaining_time": "0:29:16", "throughput": 5747.93, "total_tokens": 12026736} {"current_steps": 18445, "total_steps": 33920, "loss": 0.3227, "lr": 5.109074425172806e-06, "epoch": 10.87558962264151, "percentage": 54.38, "elapsed_time": "0:34:52", "remaining_time": "0:29:15", "throughput": 5747.83, "total_tokens": 12029296} {"current_steps": 18450, "total_steps": 33920, "loss": 0.3229, "lr": 5.106502308973967e-06, "epoch": 10.878537735849056, "percentage": 54.39, "elapsed_time": "0:34:53", "remaining_time": "0:29:15", "throughput": 5747.88, "total_tokens": 12032880} {"current_steps": 18455, "total_steps": 33920, "loss": 0.4329, "lr": 5.103930164578184e-06, "epoch": 10.881485849056604, "percentage": 54.41, "elapsed_time": "0:34:54", "remaining_time": "0:29:14", "throughput": 5748.04, "total_tokens": 12036912} {"current_steps": 18460, "total_steps": 33920, "loss": 0.3234, "lr": 5.101357992666441e-06, "epoch": 10.88443396226415, "percentage": 54.42, "elapsed_time": "0:34:54", "remaining_time": "0:29:14", "throughput": 5747.83, "total_tokens": 12039632} {"current_steps": 18465, "total_steps": 33920, "loss": 0.422, "lr": 5.098785793919733e-06, "epoch": 10.887382075471699, "percentage": 54.44, "elapsed_time": "0:34:55", "remaining_time": "0:29:13", "throughput": 5748.09, "total_tokens": 12043632} {"current_steps": 18470, "total_steps": 33920, "loss": 0.4758, "lr": 5.096213569019061e-06, "epoch": 10.890330188679245, "percentage": 54.45, "elapsed_time": "0:34:55", "remaining_time": "0:29:13", "throughput": 5748.37, "total_tokens": 12047824} {"current_steps": 18475, "total_steps": 33920, "loss": 0.2931, "lr": 5.0936413186454315e-06, "epoch": 10.893278301886792, "percentage": 54.47, "elapsed_time": "0:34:56", "remaining_time": "0:29:12", "throughput": 5748.18, "total_tokens": 12050480} {"current_steps": 18480, "total_steps": 33920, "loss": 0.4547, "lr": 5.0910690434798584e-06, "epoch": 10.89622641509434, "percentage": 54.48, "elapsed_time": "0:34:56", "remaining_time": "0:29:11", "throughput": 5748.24, "total_tokens": 12053680} {"current_steps": 18485, "total_steps": 33920, "loss": 0.3956, "lr": 5.088496744203364e-06, "epoch": 10.899174528301886, "percentage": 54.5, "elapsed_time": "0:34:57", "remaining_time": "0:29:11", "throughput": 5748.23, "total_tokens": 12056688} {"current_steps": 18490, "total_steps": 33920, "loss": 0.3798, "lr": 5.085924421496976e-06, "epoch": 10.902122641509434, "percentage": 54.51, "elapsed_time": "0:34:58", "remaining_time": "0:29:10", "throughput": 5748.29, "total_tokens": 12060720} {"current_steps": 18495, "total_steps": 33920, "loss": 0.2465, "lr": 5.083352076041725e-06, "epoch": 10.90507075471698, "percentage": 54.53, "elapsed_time": "0:34:58", "remaining_time": "0:29:10", "throughput": 5748.08, "total_tokens": 12063216} {"current_steps": 18500, "total_steps": 33920, "loss": 0.3978, "lr": 5.080779708518654e-06, "epoch": 10.908018867924529, "percentage": 54.54, "elapsed_time": "0:34:59", "remaining_time": "0:29:09", "throughput": 5748.06, "total_tokens": 12066800} {"current_steps": 18505, "total_steps": 33920, "loss": 0.3492, "lr": 5.078207319608807e-06, "epoch": 10.910966981132075, "percentage": 54.55, "elapsed_time": "0:34:59", "remaining_time": "0:29:09", "throughput": 5748.12, "total_tokens": 12070320} {"current_steps": 18510, "total_steps": 33920, "loss": 0.3543, "lr": 5.075634909993235e-06, "epoch": 10.913915094339622, "percentage": 54.57, "elapsed_time": "0:35:00", "remaining_time": "0:29:08", "throughput": 5748.19, "total_tokens": 12073296} {"current_steps": 18515, "total_steps": 33920, "loss": 0.336, "lr": 5.073062480352995e-06, "epoch": 10.91686320754717, "percentage": 54.58, "elapsed_time": "0:35:00", "remaining_time": "0:29:07", "throughput": 5747.87, "total_tokens": 12075472} {"current_steps": 18520, "total_steps": 33920, "loss": 0.395, "lr": 5.070490031369149e-06, "epoch": 10.919811320754716, "percentage": 54.6, "elapsed_time": "0:35:01", "remaining_time": "0:29:07", "throughput": 5747.91, "total_tokens": 12078384} {"current_steps": 18525, "total_steps": 33920, "loss": 0.3274, "lr": 5.067917563722762e-06, "epoch": 10.922759433962264, "percentage": 54.61, "elapsed_time": "0:35:01", "remaining_time": "0:29:06", "throughput": 5748.08, "total_tokens": 12081808} {"current_steps": 18530, "total_steps": 33920, "loss": 0.4302, "lr": 5.065345078094907e-06, "epoch": 10.92570754716981, "percentage": 54.63, "elapsed_time": "0:35:02", "remaining_time": "0:29:06", "throughput": 5748.2, "total_tokens": 12085200} {"current_steps": 18535, "total_steps": 33920, "loss": 0.3497, "lr": 5.062772575166663e-06, "epoch": 10.928655660377359, "percentage": 54.64, "elapsed_time": "0:35:02", "remaining_time": "0:29:05", "throughput": 5748.11, "total_tokens": 12087888} {"current_steps": 18540, "total_steps": 33920, "loss": 0.2891, "lr": 5.0602000556191075e-06, "epoch": 10.931603773584905, "percentage": 54.66, "elapsed_time": "0:35:03", "remaining_time": "0:29:04", "throughput": 5748.06, "total_tokens": 12090608} {"current_steps": 18545, "total_steps": 33920, "loss": 0.2786, "lr": 5.0576275201333284e-06, "epoch": 10.934551886792454, "percentage": 54.67, "elapsed_time": "0:35:04", "remaining_time": "0:29:04", "throughput": 5748.35, "total_tokens": 12094960} {"current_steps": 18550, "total_steps": 33920, "loss": 0.3768, "lr": 5.055054969390415e-06, "epoch": 10.9375, "percentage": 54.69, "elapsed_time": "0:35:04", "remaining_time": "0:29:03", "throughput": 5748.41, "total_tokens": 12098352} {"current_steps": 18555, "total_steps": 33920, "loss": 0.4303, "lr": 5.052482404071461e-06, "epoch": 10.940448113207546, "percentage": 54.7, "elapsed_time": "0:35:05", "remaining_time": "0:29:03", "throughput": 5748.53, "total_tokens": 12101840} {"current_steps": 18560, "total_steps": 33920, "loss": 0.4604, "lr": 5.049909824857564e-06, "epoch": 10.943396226415095, "percentage": 54.72, "elapsed_time": "0:35:05", "remaining_time": "0:29:02", "throughput": 5748.75, "total_tokens": 12106256} {"current_steps": 18565, "total_steps": 33920, "loss": 0.4776, "lr": 5.047337232429827e-06, "epoch": 10.946344339622641, "percentage": 54.73, "elapsed_time": "0:35:06", "remaining_time": "0:29:02", "throughput": 5748.52, "total_tokens": 12108528} {"current_steps": 18570, "total_steps": 33920, "loss": 0.3411, "lr": 5.044764627469354e-06, "epoch": 10.94929245283019, "percentage": 54.75, "elapsed_time": "0:35:06", "remaining_time": "0:29:01", "throughput": 5748.66, "total_tokens": 12111920} {"current_steps": 18575, "total_steps": 33920, "loss": 0.3128, "lr": 5.042192010657251e-06, "epoch": 10.952240566037736, "percentage": 54.76, "elapsed_time": "0:35:07", "remaining_time": "0:29:00", "throughput": 5748.78, "total_tokens": 12115024} {"current_steps": 18580, "total_steps": 33920, "loss": 0.3344, "lr": 5.039619382674632e-06, "epoch": 10.955188679245284, "percentage": 54.78, "elapsed_time": "0:35:07", "remaining_time": "0:29:00", "throughput": 5748.85, "total_tokens": 12118096} {"current_steps": 18585, "total_steps": 33920, "loss": 0.3442, "lr": 5.0370467442026115e-06, "epoch": 10.95813679245283, "percentage": 54.79, "elapsed_time": "0:35:08", "remaining_time": "0:28:59", "throughput": 5749.03, "total_tokens": 12122224} {"current_steps": 18590, "total_steps": 33920, "loss": 0.3679, "lr": 5.034474095922304e-06, "epoch": 10.961084905660378, "percentage": 54.81, "elapsed_time": "0:35:09", "remaining_time": "0:28:59", "throughput": 5749.17, "total_tokens": 12125552} {"current_steps": 18595, "total_steps": 33920, "loss": 0.2092, "lr": 5.031901438514832e-06, "epoch": 10.964033018867925, "percentage": 54.82, "elapsed_time": "0:35:09", "remaining_time": "0:28:58", "throughput": 5749.43, "total_tokens": 12129232} {"current_steps": 18600, "total_steps": 33920, "loss": 0.4918, "lr": 5.0293287726613185e-06, "epoch": 10.966981132075471, "percentage": 54.83, "elapsed_time": "0:35:10", "remaining_time": "0:28:58", "throughput": 5749.43, "total_tokens": 12132176} {"current_steps": 18605, "total_steps": 33920, "loss": 0.4941, "lr": 5.0267560990428836e-06, "epoch": 10.96992924528302, "percentage": 54.85, "elapsed_time": "0:35:10", "remaining_time": "0:28:57", "throughput": 5749.58, "total_tokens": 12135600} {"current_steps": 18610, "total_steps": 33920, "loss": 0.3432, "lr": 5.024183418340657e-06, "epoch": 10.972877358490566, "percentage": 54.86, "elapsed_time": "0:35:11", "remaining_time": "0:28:56", "throughput": 5749.74, "total_tokens": 12139088} {"current_steps": 18615, "total_steps": 33920, "loss": 0.2516, "lr": 5.021610731235766e-06, "epoch": 10.975825471698114, "percentage": 54.88, "elapsed_time": "0:35:11", "remaining_time": "0:28:56", "throughput": 5749.97, "total_tokens": 12143024} {"current_steps": 18620, "total_steps": 33920, "loss": 0.3362, "lr": 5.01903803840934e-06, "epoch": 10.97877358490566, "percentage": 54.89, "elapsed_time": "0:35:12", "remaining_time": "0:28:55", "throughput": 5750.12, "total_tokens": 12146640} {"current_steps": 18625, "total_steps": 33920, "loss": 0.3411, "lr": 5.016465340542514e-06, "epoch": 10.981721698113208, "percentage": 54.91, "elapsed_time": "0:35:13", "remaining_time": "0:28:55", "throughput": 5750.35, "total_tokens": 12150704} {"current_steps": 18630, "total_steps": 33920, "loss": 0.3694, "lr": 5.013892638316417e-06, "epoch": 10.984669811320755, "percentage": 54.92, "elapsed_time": "0:35:13", "remaining_time": "0:28:54", "throughput": 5750.69, "total_tokens": 12155920} {"current_steps": 18635, "total_steps": 33920, "loss": 0.377, "lr": 5.011319932412182e-06, "epoch": 10.987617924528301, "percentage": 54.94, "elapsed_time": "0:35:14", "remaining_time": "0:28:54", "throughput": 5750.52, "total_tokens": 12158352} {"current_steps": 18640, "total_steps": 33920, "loss": 0.2736, "lr": 5.008747223510947e-06, "epoch": 10.99056603773585, "percentage": 54.95, "elapsed_time": "0:35:14", "remaining_time": "0:28:53", "throughput": 5750.78, "total_tokens": 12162512} {"current_steps": 18645, "total_steps": 33920, "loss": 0.3488, "lr": 5.006174512293849e-06, "epoch": 10.993514150943396, "percentage": 54.97, "elapsed_time": "0:35:15", "remaining_time": "0:28:53", "throughput": 5750.71, "total_tokens": 12165296} {"current_steps": 18650, "total_steps": 33920, "loss": 0.3677, "lr": 5.003601799442019e-06, "epoch": 10.996462264150944, "percentage": 54.98, "elapsed_time": "0:35:15", "remaining_time": "0:28:52", "throughput": 5750.83, "total_tokens": 12168720} {"current_steps": 18655, "total_steps": 33920, "loss": 0.4537, "lr": 5.0010290856366e-06, "epoch": 10.99941037735849, "percentage": 55.0, "elapsed_time": "0:35:16", "remaining_time": "0:28:51", "throughput": 5750.95, "total_tokens": 12171856} {"current_steps": 18660, "total_steps": 33920, "loss": 0.2664, "lr": 4.998456371558726e-06, "epoch": 11.002358490566039, "percentage": 55.01, "elapsed_time": "0:35:17", "remaining_time": "0:28:51", "throughput": 5749.99, "total_tokens": 12174800} {"current_steps": 18665, "total_steps": 33920, "loss": 0.4325, "lr": 4.995883657889531e-06, "epoch": 11.005306603773585, "percentage": 55.03, "elapsed_time": "0:35:17", "remaining_time": "0:28:51", "throughput": 5750.19, "total_tokens": 12178544} {"current_steps": 18670, "total_steps": 33920, "loss": 0.3309, "lr": 4.993310945310158e-06, "epoch": 11.008254716981131, "percentage": 55.04, "elapsed_time": "0:35:18", "remaining_time": "0:28:50", "throughput": 5750.37, "total_tokens": 12182192} {"current_steps": 18675, "total_steps": 33920, "loss": 0.3315, "lr": 4.9907382345017416e-06, "epoch": 11.01120283018868, "percentage": 55.06, "elapsed_time": "0:35:19", "remaining_time": "0:28:49", "throughput": 5750.54, "total_tokens": 12185552} {"current_steps": 18680, "total_steps": 33920, "loss": 0.4825, "lr": 4.988165526145416e-06, "epoch": 11.014150943396226, "percentage": 55.07, "elapsed_time": "0:35:19", "remaining_time": "0:28:49", "throughput": 5750.42, "total_tokens": 12188176} {"current_steps": 18685, "total_steps": 33920, "loss": 0.29, "lr": 4.985592820922319e-06, "epoch": 11.017099056603774, "percentage": 55.09, "elapsed_time": "0:35:20", "remaining_time": "0:28:48", "throughput": 5750.33, "total_tokens": 12191152} {"current_steps": 18690, "total_steps": 33920, "loss": 0.3524, "lr": 4.983020119513586e-06, "epoch": 11.02004716981132, "percentage": 55.1, "elapsed_time": "0:35:20", "remaining_time": "0:28:48", "throughput": 5750.34, "total_tokens": 12194448} {"current_steps": 18695, "total_steps": 33920, "loss": 0.3198, "lr": 4.9804474226003465e-06, "epoch": 11.022995283018869, "percentage": 55.11, "elapsed_time": "0:35:21", "remaining_time": "0:28:47", "throughput": 5750.47, "total_tokens": 12197776} {"current_steps": 18700, "total_steps": 33920, "loss": 0.342, "lr": 4.977874730863739e-06, "epoch": 11.025943396226415, "percentage": 55.13, "elapsed_time": "0:35:21", "remaining_time": "0:28:46", "throughput": 5750.63, "total_tokens": 12201424} {"current_steps": 18705, "total_steps": 33920, "loss": 0.3029, "lr": 4.975302044984889e-06, "epoch": 11.028891509433961, "percentage": 55.14, "elapsed_time": "0:35:22", "remaining_time": "0:28:46", "throughput": 5750.46, "total_tokens": 12204016} {"current_steps": 18710, "total_steps": 33920, "loss": 0.3925, "lr": 4.972729365644931e-06, "epoch": 11.03183962264151, "percentage": 55.16, "elapsed_time": "0:35:22", "remaining_time": "0:28:45", "throughput": 5750.35, "total_tokens": 12207120} {"current_steps": 18715, "total_steps": 33920, "loss": 0.5008, "lr": 4.97015669352499e-06, "epoch": 11.034787735849056, "percentage": 55.17, "elapsed_time": "0:35:23", "remaining_time": "0:28:45", "throughput": 5750.59, "total_tokens": 12210992} {"current_steps": 18720, "total_steps": 33920, "loss": 0.3703, "lr": 4.967584029306194e-06, "epoch": 11.037735849056604, "percentage": 55.19, "elapsed_time": "0:35:24", "remaining_time": "0:28:44", "throughput": 5750.86, "total_tokens": 12215184} {"current_steps": 18725, "total_steps": 33920, "loss": 0.3677, "lr": 4.965011373669666e-06, "epoch": 11.04068396226415, "percentage": 55.2, "elapsed_time": "0:35:24", "remaining_time": "0:28:44", "throughput": 5751.02, "total_tokens": 12218928} {"current_steps": 18730, "total_steps": 33920, "loss": 0.3451, "lr": 4.962438727296527e-06, "epoch": 11.043632075471699, "percentage": 55.22, "elapsed_time": "0:35:25", "remaining_time": "0:28:43", "throughput": 5751.15, "total_tokens": 12222032} {"current_steps": 18735, "total_steps": 33920, "loss": 0.4006, "lr": 4.959866090867897e-06, "epoch": 11.046580188679245, "percentage": 55.23, "elapsed_time": "0:35:25", "remaining_time": "0:28:42", "throughput": 5751.08, "total_tokens": 12225104} {"current_steps": 18740, "total_steps": 33920, "loss": 0.3898, "lr": 4.957293465064893e-06, "epoch": 11.049528301886792, "percentage": 55.25, "elapsed_time": "0:35:26", "remaining_time": "0:28:42", "throughput": 5751.0, "total_tokens": 12227824} {"current_steps": 18745, "total_steps": 33920, "loss": 0.3607, "lr": 4.954720850568627e-06, "epoch": 11.05247641509434, "percentage": 55.26, "elapsed_time": "0:35:26", "remaining_time": "0:28:41", "throughput": 5750.92, "total_tokens": 12230448} {"current_steps": 18750, "total_steps": 33920, "loss": 0.3053, "lr": 4.952148248060212e-06, "epoch": 11.055424528301886, "percentage": 55.28, "elapsed_time": "0:35:27", "remaining_time": "0:28:41", "throughput": 5750.96, "total_tokens": 12233776} {"current_steps": 18755, "total_steps": 33920, "loss": 0.2564, "lr": 4.949575658220755e-06, "epoch": 11.058372641509434, "percentage": 55.29, "elapsed_time": "0:35:27", "remaining_time": "0:28:40", "throughput": 5750.73, "total_tokens": 12236240} {"current_steps": 18760, "total_steps": 33920, "loss": 0.4753, "lr": 4.947003081731359e-06, "epoch": 11.06132075471698, "percentage": 55.31, "elapsed_time": "0:35:28", "remaining_time": "0:28:39", "throughput": 5750.87, "total_tokens": 12239504} {"current_steps": 18765, "total_steps": 33920, "loss": 0.3391, "lr": 4.944430519273126e-06, "epoch": 11.064268867924529, "percentage": 55.32, "elapsed_time": "0:35:28", "remaining_time": "0:28:39", "throughput": 5750.85, "total_tokens": 12242416} {"current_steps": 18770, "total_steps": 33920, "loss": 0.4231, "lr": 4.941857971527152e-06, "epoch": 11.067216981132075, "percentage": 55.34, "elapsed_time": "0:35:29", "remaining_time": "0:28:38", "throughput": 5750.97, "total_tokens": 12246192} {"current_steps": 18775, "total_steps": 33920, "loss": 0.3938, "lr": 4.93928543917453e-06, "epoch": 11.070165094339623, "percentage": 55.35, "elapsed_time": "0:35:30", "remaining_time": "0:28:38", "throughput": 5751.21, "total_tokens": 12250096} {"current_steps": 18780, "total_steps": 33920, "loss": 0.4379, "lr": 4.93671292289635e-06, "epoch": 11.07311320754717, "percentage": 55.37, "elapsed_time": "0:35:30", "remaining_time": "0:28:37", "throughput": 5751.5, "total_tokens": 12254032} {"current_steps": 18785, "total_steps": 33920, "loss": 0.3173, "lr": 4.934140423373698e-06, "epoch": 11.076061320754716, "percentage": 55.38, "elapsed_time": "0:35:31", "remaining_time": "0:28:37", "throughput": 5751.65, "total_tokens": 12257424} {"current_steps": 18790, "total_steps": 33920, "loss": 0.263, "lr": 4.931567941287651e-06, "epoch": 11.079009433962264, "percentage": 55.4, "elapsed_time": "0:35:31", "remaining_time": "0:28:36", "throughput": 5751.85, "total_tokens": 12260944} {"current_steps": 18795, "total_steps": 33920, "loss": 0.3273, "lr": 4.9289954773192875e-06, "epoch": 11.08195754716981, "percentage": 55.41, "elapsed_time": "0:35:32", "remaining_time": "0:28:35", "throughput": 5751.52, "total_tokens": 12263056} {"current_steps": 18800, "total_steps": 33920, "loss": 0.2669, "lr": 4.926423032149677e-06, "epoch": 11.084905660377359, "percentage": 55.42, "elapsed_time": "0:35:32", "remaining_time": "0:28:35", "throughput": 5751.58, "total_tokens": 12266480} {"current_steps": 18805, "total_steps": 33920, "loss": 0.3957, "lr": 4.923850606459883e-06, "epoch": 11.087853773584905, "percentage": 55.44, "elapsed_time": "0:35:33", "remaining_time": "0:28:34", "throughput": 5751.55, "total_tokens": 12269328} {"current_steps": 18810, "total_steps": 33920, "loss": 0.2954, "lr": 4.921278200930972e-06, "epoch": 11.090801886792454, "percentage": 55.45, "elapsed_time": "0:35:33", "remaining_time": "0:28:33", "throughput": 5751.31, "total_tokens": 12271408} {"current_steps": 18815, "total_steps": 33920, "loss": 0.4298, "lr": 4.918705816243996e-06, "epoch": 11.09375, "percentage": 55.47, "elapsed_time": "0:35:34", "remaining_time": "0:28:33", "throughput": 5751.33, "total_tokens": 12274384} {"current_steps": 18820, "total_steps": 33920, "loss": 0.3106, "lr": 4.916133453080007e-06, "epoch": 11.096698113207546, "percentage": 55.48, "elapsed_time": "0:35:34", "remaining_time": "0:28:32", "throughput": 5751.38, "total_tokens": 12277648} {"current_steps": 18825, "total_steps": 33920, "loss": 0.4145, "lr": 4.913561112120046e-06, "epoch": 11.099646226415095, "percentage": 55.5, "elapsed_time": "0:35:35", "remaining_time": "0:28:32", "throughput": 5751.72, "total_tokens": 12282096} {"current_steps": 18830, "total_steps": 33920, "loss": 0.4101, "lr": 4.910988794045154e-06, "epoch": 11.102594339622641, "percentage": 55.51, "elapsed_time": "0:35:35", "remaining_time": "0:28:31", "throughput": 5751.66, "total_tokens": 12284912} {"current_steps": 18835, "total_steps": 33920, "loss": 0.3242, "lr": 4.9084164995363626e-06, "epoch": 11.10554245283019, "percentage": 55.53, "elapsed_time": "0:35:36", "remaining_time": "0:28:31", "throughput": 5751.66, "total_tokens": 12287824} {"current_steps": 18840, "total_steps": 33920, "loss": 0.4541, "lr": 4.905844229274697e-06, "epoch": 11.108490566037736, "percentage": 55.54, "elapsed_time": "0:35:36", "remaining_time": "0:28:30", "throughput": 5751.76, "total_tokens": 12291152} {"current_steps": 18845, "total_steps": 33920, "loss": 0.3456, "lr": 4.903271983941177e-06, "epoch": 11.111438679245284, "percentage": 55.56, "elapsed_time": "0:35:37", "remaining_time": "0:28:29", "throughput": 5751.76, "total_tokens": 12293904} {"current_steps": 18850, "total_steps": 33920, "loss": 0.3313, "lr": 4.900699764216818e-06, "epoch": 11.11438679245283, "percentage": 55.57, "elapsed_time": "0:35:37", "remaining_time": "0:28:29", "throughput": 5751.55, "total_tokens": 12296432} {"current_steps": 18855, "total_steps": 33920, "loss": 0.3298, "lr": 4.898127570782622e-06, "epoch": 11.117334905660377, "percentage": 55.59, "elapsed_time": "0:35:38", "remaining_time": "0:28:28", "throughput": 5751.47, "total_tokens": 12299376} {"current_steps": 18860, "total_steps": 33920, "loss": 0.3568, "lr": 4.895555404319592e-06, "epoch": 11.120283018867925, "percentage": 55.6, "elapsed_time": "0:35:38", "remaining_time": "0:28:27", "throughput": 5751.26, "total_tokens": 12301712} {"current_steps": 18865, "total_steps": 33920, "loss": 0.4002, "lr": 4.89298326550872e-06, "epoch": 11.123231132075471, "percentage": 55.62, "elapsed_time": "0:35:39", "remaining_time": "0:28:27", "throughput": 5751.07, "total_tokens": 12304496} {"current_steps": 18870, "total_steps": 33920, "loss": 0.4819, "lr": 4.8904111550309876e-06, "epoch": 11.12617924528302, "percentage": 55.63, "elapsed_time": "0:35:40", "remaining_time": "0:28:26", "throughput": 5750.96, "total_tokens": 12307344} {"current_steps": 18875, "total_steps": 33920, "loss": 0.3284, "lr": 4.8878390735673755e-06, "epoch": 11.129127358490566, "percentage": 55.65, "elapsed_time": "0:35:40", "remaining_time": "0:28:26", "throughput": 5750.97, "total_tokens": 12310576} {"current_steps": 18880, "total_steps": 33920, "loss": 0.324, "lr": 4.8852670217988505e-06, "epoch": 11.132075471698114, "percentage": 55.66, "elapsed_time": "0:35:41", "remaining_time": "0:28:25", "throughput": 5751.19, "total_tokens": 12315120} {"current_steps": 18885, "total_steps": 33920, "loss": 0.3037, "lr": 4.882695000406377e-06, "epoch": 11.13502358490566, "percentage": 55.68, "elapsed_time": "0:35:41", "remaining_time": "0:28:25", "throughput": 5751.15, "total_tokens": 12318320} {"current_steps": 18890, "total_steps": 33920, "loss": 0.344, "lr": 4.880123010070909e-06, "epoch": 11.137971698113208, "percentage": 55.69, "elapsed_time": "0:35:42", "remaining_time": "0:28:24", "throughput": 5751.11, "total_tokens": 12321328} {"current_steps": 18895, "total_steps": 33920, "loss": 0.2915, "lr": 4.877551051473388e-06, "epoch": 11.140919811320755, "percentage": 55.7, "elapsed_time": "0:35:42", "remaining_time": "0:28:24", "throughput": 5751.07, "total_tokens": 12324432} {"current_steps": 18900, "total_steps": 33920, "loss": 0.4132, "lr": 4.874979125294755e-06, "epoch": 11.143867924528301, "percentage": 55.72, "elapsed_time": "0:35:43", "remaining_time": "0:28:23", "throughput": 5751.09, "total_tokens": 12327632} {"current_steps": 18905, "total_steps": 33920, "loss": 0.4083, "lr": 4.872407232215937e-06, "epoch": 11.14681603773585, "percentage": 55.73, "elapsed_time": "0:35:44", "remaining_time": "0:28:22", "throughput": 5751.03, "total_tokens": 12330544} {"current_steps": 18910, "total_steps": 33920, "loss": 0.3859, "lr": 4.8698353729178546e-06, "epoch": 11.149764150943396, "percentage": 55.75, "elapsed_time": "0:35:44", "remaining_time": "0:28:22", "throughput": 5751.06, "total_tokens": 12333968} {"current_steps": 18915, "total_steps": 33920, "loss": 0.3358, "lr": 4.867263548081418e-06, "epoch": 11.152712264150944, "percentage": 55.76, "elapsed_time": "0:35:45", "remaining_time": "0:28:21", "throughput": 5751.02, "total_tokens": 12337104} {"current_steps": 18920, "total_steps": 33920, "loss": 0.236, "lr": 4.8646917583875304e-06, "epoch": 11.15566037735849, "percentage": 55.78, "elapsed_time": "0:35:45", "remaining_time": "0:28:21", "throughput": 5751.15, "total_tokens": 12340656} {"current_steps": 18925, "total_steps": 33920, "loss": 0.4384, "lr": 4.862120004517082e-06, "epoch": 11.158608490566039, "percentage": 55.79, "elapsed_time": "0:35:46", "remaining_time": "0:28:20", "throughput": 5751.16, "total_tokens": 12344304} {"current_steps": 18930, "total_steps": 33920, "loss": 0.294, "lr": 4.859548287150956e-06, "epoch": 11.161556603773585, "percentage": 55.81, "elapsed_time": "0:35:47", "remaining_time": "0:28:20", "throughput": 5751.56, "total_tokens": 12350800} {"current_steps": 18935, "total_steps": 33920, "loss": 0.3419, "lr": 4.8569766069700275e-06, "epoch": 11.164504716981131, "percentage": 55.82, "elapsed_time": "0:35:47", "remaining_time": "0:28:19", "throughput": 5751.6, "total_tokens": 12354096} {"current_steps": 18940, "total_steps": 33920, "loss": 0.3323, "lr": 4.854404964655158e-06, "epoch": 11.16745283018868, "percentage": 55.84, "elapsed_time": "0:35:48", "remaining_time": "0:28:19", "throughput": 5751.65, "total_tokens": 12357520} {"current_steps": 18945, "total_steps": 33920, "loss": 0.2989, "lr": 4.8518333608872015e-06, "epoch": 11.170400943396226, "percentage": 55.85, "elapsed_time": "0:35:49", "remaining_time": "0:28:18", "throughput": 5751.54, "total_tokens": 12360592} {"current_steps": 18950, "total_steps": 33920, "loss": 0.4278, "lr": 4.849261796347002e-06, "epoch": 11.173349056603774, "percentage": 55.87, "elapsed_time": "0:35:49", "remaining_time": "0:28:18", "throughput": 5751.35, "total_tokens": 12363120} {"current_steps": 18955, "total_steps": 33920, "loss": 0.3995, "lr": 4.846690271715391e-06, "epoch": 11.17629716981132, "percentage": 55.88, "elapsed_time": "0:35:50", "remaining_time": "0:28:17", "throughput": 5751.47, "total_tokens": 12366896} {"current_steps": 18960, "total_steps": 33920, "loss": 0.4895, "lr": 4.844118787673191e-06, "epoch": 11.179245283018869, "percentage": 55.9, "elapsed_time": "0:35:50", "remaining_time": "0:28:17", "throughput": 5751.52, "total_tokens": 12370096} {"current_steps": 18965, "total_steps": 33920, "loss": 0.2992, "lr": 4.841547344901214e-06, "epoch": 11.182193396226415, "percentage": 55.91, "elapsed_time": "0:35:51", "remaining_time": "0:28:16", "throughput": 5751.69, "total_tokens": 12373808} {"current_steps": 18970, "total_steps": 33920, "loss": 0.3822, "lr": 4.838975944080261e-06, "epoch": 11.185141509433961, "percentage": 55.93, "elapsed_time": "0:35:51", "remaining_time": "0:28:15", "throughput": 5751.98, "total_tokens": 12378064} {"current_steps": 18975, "total_steps": 33920, "loss": 0.3382, "lr": 4.83640458589112e-06, "epoch": 11.18808962264151, "percentage": 55.94, "elapsed_time": "0:35:52", "remaining_time": "0:28:15", "throughput": 5752.19, "total_tokens": 12381744} {"current_steps": 18980, "total_steps": 33920, "loss": 0.3703, "lr": 4.833833271014571e-06, "epoch": 11.191037735849056, "percentage": 55.96, "elapsed_time": "0:35:53", "remaining_time": "0:28:14", "throughput": 5752.11, "total_tokens": 12384656} {"current_steps": 18985, "total_steps": 33920, "loss": 0.3804, "lr": 4.831262000131379e-06, "epoch": 11.193985849056604, "percentage": 55.97, "elapsed_time": "0:35:53", "remaining_time": "0:28:14", "throughput": 5752.29, "total_tokens": 12388336} {"current_steps": 18990, "total_steps": 33920, "loss": 0.2396, "lr": 4.828690773922299e-06, "epoch": 11.19693396226415, "percentage": 55.98, "elapsed_time": "0:35:54", "remaining_time": "0:28:13", "throughput": 5751.98, "total_tokens": 12390704} {"current_steps": 18995, "total_steps": 33920, "loss": 0.238, "lr": 4.826119593068074e-06, "epoch": 11.199882075471699, "percentage": 56.0, "elapsed_time": "0:35:54", "remaining_time": "0:28:13", "throughput": 5752.3, "total_tokens": 12395024} {"current_steps": 19000, "total_steps": 33920, "loss": 0.3546, "lr": 4.8235484582494375e-06, "epoch": 11.202830188679245, "percentage": 56.01, "elapsed_time": "0:35:55", "remaining_time": "0:28:12", "throughput": 5752.3, "total_tokens": 12398192} {"current_steps": 19005, "total_steps": 33920, "loss": 0.6617, "lr": 4.8209773701471076e-06, "epoch": 11.205778301886792, "percentage": 56.03, "elapsed_time": "0:35:55", "remaining_time": "0:28:11", "throughput": 5752.31, "total_tokens": 12401392} {"current_steps": 19010, "total_steps": 33920, "loss": 0.5045, "lr": 4.818406329441789e-06, "epoch": 11.20872641509434, "percentage": 56.04, "elapsed_time": "0:35:56", "remaining_time": "0:28:11", "throughput": 5752.36, "total_tokens": 12404912} {"current_steps": 19015, "total_steps": 33920, "loss": 0.4558, "lr": 4.815835336814179e-06, "epoch": 11.211674528301886, "percentage": 56.06, "elapsed_time": "0:35:57", "remaining_time": "0:28:11", "throughput": 5752.77, "total_tokens": 12411408} {"current_steps": 19020, "total_steps": 33920, "loss": 0.3711, "lr": 4.813264392944957e-06, "epoch": 11.214622641509434, "percentage": 56.07, "elapsed_time": "0:35:58", "remaining_time": "0:28:10", "throughput": 5752.64, "total_tokens": 12414480} {"current_steps": 19025, "total_steps": 33920, "loss": 0.285, "lr": 4.8106934985147905e-06, "epoch": 11.21757075471698, "percentage": 56.09, "elapsed_time": "0:35:58", "remaining_time": "0:28:10", "throughput": 5752.65, "total_tokens": 12418160} {"current_steps": 19030, "total_steps": 33920, "loss": 0.3588, "lr": 4.808122654204338e-06, "epoch": 11.220518867924529, "percentage": 56.1, "elapsed_time": "0:35:59", "remaining_time": "0:28:09", "throughput": 5752.58, "total_tokens": 12421360} {"current_steps": 19035, "total_steps": 33920, "loss": 0.4009, "lr": 4.805551860694239e-06, "epoch": 11.223466981132075, "percentage": 56.12, "elapsed_time": "0:35:59", "remaining_time": "0:28:08", "throughput": 5752.36, "total_tokens": 12423888} {"current_steps": 19040, "total_steps": 33920, "loss": 0.3855, "lr": 4.802981118665122e-06, "epoch": 11.226415094339623, "percentage": 56.13, "elapsed_time": "0:36:00", "remaining_time": "0:28:08", "throughput": 5752.62, "total_tokens": 12428208} {"current_steps": 19045, "total_steps": 33920, "loss": 0.4328, "lr": 4.800410428797604e-06, "epoch": 11.22936320754717, "percentage": 56.15, "elapsed_time": "0:36:00", "remaining_time": "0:28:07", "throughput": 5752.7, "total_tokens": 12431568} {"current_steps": 19050, "total_steps": 33920, "loss": 0.3515, "lr": 4.797839791772286e-06, "epoch": 11.232311320754716, "percentage": 56.16, "elapsed_time": "0:36:01", "remaining_time": "0:28:07", "throughput": 5752.69, "total_tokens": 12434384} {"current_steps": 19055, "total_steps": 33920, "loss": 0.3832, "lr": 4.795269208269752e-06, "epoch": 11.235259433962264, "percentage": 56.18, "elapsed_time": "0:36:02", "remaining_time": "0:28:06", "throughput": 5752.41, "total_tokens": 12436784} {"current_steps": 19060, "total_steps": 33920, "loss": 0.3189, "lr": 4.792698678970579e-06, "epoch": 11.23820754716981, "percentage": 56.19, "elapsed_time": "0:36:02", "remaining_time": "0:28:06", "throughput": 5752.61, "total_tokens": 12440592} {"current_steps": 19065, "total_steps": 33920, "loss": 0.3805, "lr": 4.7901282045553245e-06, "epoch": 11.241155660377359, "percentage": 56.21, "elapsed_time": "0:36:03", "remaining_time": "0:28:05", "throughput": 5752.52, "total_tokens": 12443344} {"current_steps": 19070, "total_steps": 33920, "loss": 0.4064, "lr": 4.787557785704531e-06, "epoch": 11.244103773584905, "percentage": 56.22, "elapsed_time": "0:36:03", "remaining_time": "0:28:04", "throughput": 5752.62, "total_tokens": 12446736} {"current_steps": 19075, "total_steps": 33920, "loss": 0.3028, "lr": 4.784987423098731e-06, "epoch": 11.247051886792454, "percentage": 56.24, "elapsed_time": "0:36:04", "remaining_time": "0:28:04", "throughput": 5752.68, "total_tokens": 12450128} {"current_steps": 19080, "total_steps": 33920, "loss": 0.3516, "lr": 4.7824171174184354e-06, "epoch": 11.25, "percentage": 56.25, "elapsed_time": "0:36:04", "remaining_time": "0:28:03", "throughput": 5752.53, "total_tokens": 12452976} {"current_steps": 19085, "total_steps": 33920, "loss": 0.3235, "lr": 4.779846869344146e-06, "epoch": 11.252948113207546, "percentage": 56.26, "elapsed_time": "0:36:05", "remaining_time": "0:28:03", "throughput": 5752.56, "total_tokens": 12455984} {"current_steps": 19090, "total_steps": 33920, "loss": 0.2961, "lr": 4.777276679556346e-06, "epoch": 11.255896226415095, "percentage": 56.28, "elapsed_time": "0:36:05", "remaining_time": "0:28:02", "throughput": 5752.52, "total_tokens": 12459088} {"current_steps": 19095, "total_steps": 33920, "loss": 0.3704, "lr": 4.774706548735507e-06, "epoch": 11.258844339622641, "percentage": 56.29, "elapsed_time": "0:36:06", "remaining_time": "0:28:01", "throughput": 5752.32, "total_tokens": 12461712} {"current_steps": 19100, "total_steps": 33920, "loss": 0.3257, "lr": 4.77213647756208e-06, "epoch": 11.26179245283019, "percentage": 56.31, "elapsed_time": "0:36:06", "remaining_time": "0:28:01", "throughput": 5752.4, "total_tokens": 12465072} {"current_steps": 19105, "total_steps": 33920, "loss": 0.3267, "lr": 4.769566466716501e-06, "epoch": 11.264740566037736, "percentage": 56.32, "elapsed_time": "0:36:07", "remaining_time": "0:28:00", "throughput": 5752.42, "total_tokens": 12467984} {"current_steps": 19110, "total_steps": 33920, "loss": 0.5089, "lr": 4.766996516879195e-06, "epoch": 11.267688679245284, "percentage": 56.34, "elapsed_time": "0:36:07", "remaining_time": "0:28:00", "throughput": 5752.5, "total_tokens": 12471280} {"current_steps": 19115, "total_steps": 33920, "loss": 0.4872, "lr": 4.764426628730564e-06, "epoch": 11.27063679245283, "percentage": 56.35, "elapsed_time": "0:36:08", "remaining_time": "0:27:59", "throughput": 5752.61, "total_tokens": 12474736} {"current_steps": 19120, "total_steps": 33920, "loss": 0.2715, "lr": 4.761856802950999e-06, "epoch": 11.273584905660377, "percentage": 56.37, "elapsed_time": "0:36:09", "remaining_time": "0:27:58", "throughput": 5752.77, "total_tokens": 12478064} {"current_steps": 19125, "total_steps": 33920, "loss": 0.5084, "lr": 4.759287040220872e-06, "epoch": 11.276533018867925, "percentage": 56.38, "elapsed_time": "0:36:09", "remaining_time": "0:27:58", "throughput": 5752.82, "total_tokens": 12480944} {"current_steps": 19130, "total_steps": 33920, "loss": 0.2879, "lr": 4.756717341220538e-06, "epoch": 11.279481132075471, "percentage": 56.4, "elapsed_time": "0:36:10", "remaining_time": "0:27:57", "throughput": 5752.79, "total_tokens": 12483728} {"current_steps": 19135, "total_steps": 33920, "loss": 0.4629, "lr": 4.7541477066303365e-06, "epoch": 11.28242924528302, "percentage": 56.41, "elapsed_time": "0:36:10", "remaining_time": "0:27:57", "throughput": 5752.64, "total_tokens": 12486160} {"current_steps": 19140, "total_steps": 33920, "loss": 0.3607, "lr": 4.75157813713059e-06, "epoch": 11.285377358490566, "percentage": 56.43, "elapsed_time": "0:36:11", "remaining_time": "0:27:56", "throughput": 5752.75, "total_tokens": 12489744} {"current_steps": 19145, "total_steps": 33920, "loss": 0.3728, "lr": 4.7490086334016e-06, "epoch": 11.288325471698114, "percentage": 56.44, "elapsed_time": "0:36:11", "remaining_time": "0:27:55", "throughput": 5752.66, "total_tokens": 12492304} {"current_steps": 19150, "total_steps": 33920, "loss": 0.319, "lr": 4.746439196123659e-06, "epoch": 11.29127358490566, "percentage": 56.46, "elapsed_time": "0:36:12", "remaining_time": "0:27:55", "throughput": 5752.89, "total_tokens": 12496144} {"current_steps": 19155, "total_steps": 33920, "loss": 0.3354, "lr": 4.743869825977032e-06, "epoch": 11.294221698113208, "percentage": 56.47, "elapsed_time": "0:36:12", "remaining_time": "0:27:54", "throughput": 5752.82, "total_tokens": 12499152} {"current_steps": 19160, "total_steps": 33920, "loss": 0.3769, "lr": 4.741300523641972e-06, "epoch": 11.297169811320755, "percentage": 56.49, "elapsed_time": "0:36:13", "remaining_time": "0:27:54", "throughput": 5752.48, "total_tokens": 12501168} {"current_steps": 19165, "total_steps": 33920, "loss": 0.3989, "lr": 4.738731289798715e-06, "epoch": 11.300117924528301, "percentage": 56.5, "elapsed_time": "0:36:13", "remaining_time": "0:27:53", "throughput": 5752.57, "total_tokens": 12504240} {"current_steps": 19170, "total_steps": 33920, "loss": 0.4335, "lr": 4.7361621251274744e-06, "epoch": 11.30306603773585, "percentage": 56.52, "elapsed_time": "0:36:14", "remaining_time": "0:27:52", "throughput": 5752.72, "total_tokens": 12507952} {"current_steps": 19175, "total_steps": 33920, "loss": 0.4033, "lr": 4.733593030308446e-06, "epoch": 11.306014150943396, "percentage": 56.53, "elapsed_time": "0:36:14", "remaining_time": "0:27:52", "throughput": 5752.82, "total_tokens": 12511536} {"current_steps": 19180, "total_steps": 33920, "loss": 0.3032, "lr": 4.731024006021814e-06, "epoch": 11.308962264150944, "percentage": 56.54, "elapsed_time": "0:36:15", "remaining_time": "0:27:51", "throughput": 5752.71, "total_tokens": 12514256} {"current_steps": 19185, "total_steps": 33920, "loss": 0.332, "lr": 4.728455052947732e-06, "epoch": 11.31191037735849, "percentage": 56.56, "elapsed_time": "0:36:15", "remaining_time": "0:27:51", "throughput": 5752.9, "total_tokens": 12517936} {"current_steps": 19190, "total_steps": 33920, "loss": 0.3474, "lr": 4.725886171766349e-06, "epoch": 11.314858490566039, "percentage": 56.57, "elapsed_time": "0:36:16", "remaining_time": "0:27:50", "throughput": 5752.87, "total_tokens": 12520784} {"current_steps": 19195, "total_steps": 33920, "loss": 0.2432, "lr": 4.723317363157781e-06, "epoch": 11.317806603773585, "percentage": 56.59, "elapsed_time": "0:36:16", "remaining_time": "0:27:50", "throughput": 5752.99, "total_tokens": 12524016} {"current_steps": 19200, "total_steps": 33920, "loss": 0.3114, "lr": 4.720748627802135e-06, "epoch": 11.320754716981131, "percentage": 56.6, "elapsed_time": "0:36:17", "remaining_time": "0:27:49", "throughput": 5752.91, "total_tokens": 12526960} {"current_steps": 19205, "total_steps": 33920, "loss": 0.3086, "lr": 4.718179966379492e-06, "epoch": 11.32370283018868, "percentage": 56.62, "elapsed_time": "0:36:18", "remaining_time": "0:27:48", "throughput": 5753.15, "total_tokens": 12530736} {"current_steps": 19210, "total_steps": 33920, "loss": 0.299, "lr": 4.715611379569919e-06, "epoch": 11.326650943396226, "percentage": 56.63, "elapsed_time": "0:36:18", "remaining_time": "0:27:48", "throughput": 5753.0, "total_tokens": 12533520} {"current_steps": 19215, "total_steps": 33920, "loss": 0.3886, "lr": 4.713042868053458e-06, "epoch": 11.329599056603774, "percentage": 56.65, "elapsed_time": "0:36:19", "remaining_time": "0:27:47", "throughput": 5753.09, "total_tokens": 12536656} {"current_steps": 19220, "total_steps": 33920, "loss": 0.4137, "lr": 4.7104744325101345e-06, "epoch": 11.33254716981132, "percentage": 56.66, "elapsed_time": "0:36:19", "remaining_time": "0:27:47", "throughput": 5753.15, "total_tokens": 12540112} {"current_steps": 19225, "total_steps": 33920, "loss": 0.2594, "lr": 4.7079060736199525e-06, "epoch": 11.335495283018869, "percentage": 56.68, "elapsed_time": "0:36:20", "remaining_time": "0:27:46", "throughput": 5752.88, "total_tokens": 12542640} {"current_steps": 19230, "total_steps": 33920, "loss": 0.3725, "lr": 4.705337792062897e-06, "epoch": 11.338443396226415, "percentage": 56.69, "elapsed_time": "0:36:20", "remaining_time": "0:27:45", "throughput": 5752.8, "total_tokens": 12545808} {"current_steps": 19235, "total_steps": 33920, "loss": 0.4459, "lr": 4.702769588518931e-06, "epoch": 11.341391509433961, "percentage": 56.71, "elapsed_time": "0:36:21", "remaining_time": "0:27:45", "throughput": 5752.74, "total_tokens": 12548528} {"current_steps": 19240, "total_steps": 33920, "loss": 0.427, "lr": 4.700201463667996e-06, "epoch": 11.34433962264151, "percentage": 56.72, "elapsed_time": "0:36:21", "remaining_time": "0:27:44", "throughput": 5752.77, "total_tokens": 12551792} {"current_steps": 19245, "total_steps": 33920, "loss": 0.4721, "lr": 4.697633418190017e-06, "epoch": 11.347287735849056, "percentage": 56.74, "elapsed_time": "0:36:22", "remaining_time": "0:27:44", "throughput": 5752.72, "total_tokens": 12555184} {"current_steps": 19250, "total_steps": 33920, "loss": 0.4315, "lr": 4.695065452764893e-06, "epoch": 11.350235849056604, "percentage": 56.75, "elapsed_time": "0:36:22", "remaining_time": "0:27:43", "throughput": 5752.75, "total_tokens": 12558160} {"current_steps": 19255, "total_steps": 33920, "loss": 0.333, "lr": 4.692497568072505e-06, "epoch": 11.35318396226415, "percentage": 56.77, "elapsed_time": "0:36:23", "remaining_time": "0:27:43", "throughput": 5752.78, "total_tokens": 12562000} {"current_steps": 19260, "total_steps": 33920, "loss": 0.3627, "lr": 4.689929764792711e-06, "epoch": 11.356132075471699, "percentage": 56.78, "elapsed_time": "0:36:24", "remaining_time": "0:27:42", "throughput": 5752.65, "total_tokens": 12564720} {"current_steps": 19265, "total_steps": 33920, "loss": 0.385, "lr": 4.687362043605349e-06, "epoch": 11.359080188679245, "percentage": 56.8, "elapsed_time": "0:36:24", "remaining_time": "0:27:41", "throughput": 5752.81, "total_tokens": 12568208} {"current_steps": 19270, "total_steps": 33920, "loss": 0.3423, "lr": 4.684794405190231e-06, "epoch": 11.362028301886792, "percentage": 56.81, "elapsed_time": "0:36:25", "remaining_time": "0:27:41", "throughput": 5752.74, "total_tokens": 12571152} {"current_steps": 19275, "total_steps": 33920, "loss": 0.3624, "lr": 4.682226850227155e-06, "epoch": 11.36497641509434, "percentage": 56.82, "elapsed_time": "0:36:25", "remaining_time": "0:27:40", "throughput": 5752.88, "total_tokens": 12574896} {"current_steps": 19280, "total_steps": 33920, "loss": 0.3234, "lr": 4.6796593793958875e-06, "epoch": 11.367924528301886, "percentage": 56.84, "elapsed_time": "0:36:26", "remaining_time": "0:27:40", "throughput": 5752.98, "total_tokens": 12578384} {"current_steps": 19285, "total_steps": 33920, "loss": 0.337, "lr": 4.6770919933761815e-06, "epoch": 11.370872641509434, "percentage": 56.85, "elapsed_time": "0:36:26", "remaining_time": "0:27:39", "throughput": 5752.86, "total_tokens": 12581168} {"current_steps": 19290, "total_steps": 33920, "loss": 0.4259, "lr": 4.6745246928477615e-06, "epoch": 11.37382075471698, "percentage": 56.87, "elapsed_time": "0:36:27", "remaining_time": "0:27:39", "throughput": 5752.9, "total_tokens": 12584272} {"current_steps": 19295, "total_steps": 33920, "loss": 0.5189, "lr": 4.671957478490332e-06, "epoch": 11.376768867924529, "percentage": 56.88, "elapsed_time": "0:36:27", "remaining_time": "0:27:38", "throughput": 5752.98, "total_tokens": 12587440} {"current_steps": 19300, "total_steps": 33920, "loss": 0.6201, "lr": 4.669390350983574e-06, "epoch": 11.379716981132075, "percentage": 56.9, "elapsed_time": "0:36:28", "remaining_time": "0:27:37", "throughput": 5753.24, "total_tokens": 12592208} {"current_steps": 19305, "total_steps": 33920, "loss": 0.2941, "lr": 4.666823311007145e-06, "epoch": 11.382665094339623, "percentage": 56.91, "elapsed_time": "0:36:29", "remaining_time": "0:27:37", "throughput": 5753.28, "total_tokens": 12595504} {"current_steps": 19310, "total_steps": 33920, "loss": 0.3889, "lr": 4.664256359240681e-06, "epoch": 11.38561320754717, "percentage": 56.93, "elapsed_time": "0:36:29", "remaining_time": "0:27:36", "throughput": 5753.06, "total_tokens": 12597776} {"current_steps": 19315, "total_steps": 33920, "loss": 0.2552, "lr": 4.661689496363793e-06, "epoch": 11.388561320754716, "percentage": 56.94, "elapsed_time": "0:36:30", "remaining_time": "0:27:36", "throughput": 5752.9, "total_tokens": 12600368} {"current_steps": 19320, "total_steps": 33920, "loss": 0.32, "lr": 4.659122723056068e-06, "epoch": 11.391509433962264, "percentage": 56.96, "elapsed_time": "0:36:30", "remaining_time": "0:27:35", "throughput": 5753.03, "total_tokens": 12603664} {"current_steps": 19325, "total_steps": 33920, "loss": 0.3748, "lr": 4.656556039997072e-06, "epoch": 11.39445754716981, "percentage": 56.97, "elapsed_time": "0:36:31", "remaining_time": "0:27:34", "throughput": 5752.94, "total_tokens": 12606544} {"current_steps": 19330, "total_steps": 33920, "loss": 0.3998, "lr": 4.653989447866345e-06, "epoch": 11.397405660377359, "percentage": 56.99, "elapsed_time": "0:36:31", "remaining_time": "0:27:34", "throughput": 5753.09, "total_tokens": 12610160} {"current_steps": 19335, "total_steps": 33920, "loss": 0.29, "lr": 4.651422947343401e-06, "epoch": 11.400353773584905, "percentage": 57.0, "elapsed_time": "0:36:32", "remaining_time": "0:27:33", "throughput": 5753.22, "total_tokens": 12613584} {"current_steps": 19340, "total_steps": 33920, "loss": 0.2793, "lr": 4.6488565391077355e-06, "epoch": 11.403301886792454, "percentage": 57.02, "elapsed_time": "0:36:32", "remaining_time": "0:27:33", "throughput": 5753.23, "total_tokens": 12616560} {"current_steps": 19345, "total_steps": 33920, "loss": 0.3551, "lr": 4.646290223838815e-06, "epoch": 11.40625, "percentage": 57.03, "elapsed_time": "0:36:33", "remaining_time": "0:27:32", "throughput": 5753.02, "total_tokens": 12619184} {"current_steps": 19350, "total_steps": 33920, "loss": 0.4112, "lr": 4.64372400221608e-06, "epoch": 11.409198113207546, "percentage": 57.05, "elapsed_time": "0:36:34", "remaining_time": "0:27:32", "throughput": 5753.01, "total_tokens": 12622384} {"current_steps": 19355, "total_steps": 33920, "loss": 0.4107, "lr": 4.641157874918953e-06, "epoch": 11.412146226415095, "percentage": 57.06, "elapsed_time": "0:36:34", "remaining_time": "0:27:31", "throughput": 5753.0, "total_tokens": 12625296} {"current_steps": 19360, "total_steps": 33920, "loss": 0.3373, "lr": 4.6385918426268245e-06, "epoch": 11.415094339622641, "percentage": 57.08, "elapsed_time": "0:36:35", "remaining_time": "0:27:30", "throughput": 5753.09, "total_tokens": 12628496} {"current_steps": 19365, "total_steps": 33920, "loss": 0.3276, "lr": 4.636025906019062e-06, "epoch": 11.41804245283019, "percentage": 57.09, "elapsed_time": "0:36:35", "remaining_time": "0:27:30", "throughput": 5753.18, "total_tokens": 12631824} {"current_steps": 19370, "total_steps": 33920, "loss": 0.4927, "lr": 4.6334600657750115e-06, "epoch": 11.420990566037736, "percentage": 57.1, "elapsed_time": "0:36:36", "remaining_time": "0:27:29", "throughput": 5753.11, "total_tokens": 12634672} {"current_steps": 19375, "total_steps": 33920, "loss": 0.4817, "lr": 4.6308943225739855e-06, "epoch": 11.423938679245284, "percentage": 57.12, "elapsed_time": "0:36:36", "remaining_time": "0:27:29", "throughput": 5753.07, "total_tokens": 12637648} {"current_steps": 19380, "total_steps": 33920, "loss": 0.4268, "lr": 4.628328677095281e-06, "epoch": 11.42688679245283, "percentage": 57.13, "elapsed_time": "0:36:37", "remaining_time": "0:27:28", "throughput": 5753.09, "total_tokens": 12640752} {"current_steps": 19385, "total_steps": 33920, "loss": 0.3703, "lr": 4.625763130018159e-06, "epoch": 11.429834905660377, "percentage": 57.15, "elapsed_time": "0:36:37", "remaining_time": "0:27:27", "throughput": 5753.0, "total_tokens": 12643952} {"current_steps": 19390, "total_steps": 33920, "loss": 0.3529, "lr": 4.6231976820218635e-06, "epoch": 11.432783018867925, "percentage": 57.16, "elapsed_time": "0:36:38", "remaining_time": "0:27:27", "throughput": 5753.04, "total_tokens": 12647216} {"current_steps": 19395, "total_steps": 33920, "loss": 0.3568, "lr": 4.620632333785605e-06, "epoch": 11.435731132075471, "percentage": 57.18, "elapsed_time": "0:36:38", "remaining_time": "0:27:26", "throughput": 5753.06, "total_tokens": 12650224} {"current_steps": 19400, "total_steps": 33920, "loss": 0.3297, "lr": 4.618067085988569e-06, "epoch": 11.43867924528302, "percentage": 57.19, "elapsed_time": "0:36:39", "remaining_time": "0:27:26", "throughput": 5753.08, "total_tokens": 12653488} {"current_steps": 19405, "total_steps": 33920, "loss": 0.2986, "lr": 4.615501939309921e-06, "epoch": 11.441627358490566, "percentage": 57.21, "elapsed_time": "0:36:40", "remaining_time": "0:27:25", "throughput": 5753.22, "total_tokens": 12657232} {"current_steps": 19410, "total_steps": 33920, "loss": 0.3339, "lr": 4.612936894428791e-06, "epoch": 11.444575471698114, "percentage": 57.22, "elapsed_time": "0:36:40", "remaining_time": "0:27:25", "throughput": 5753.06, "total_tokens": 12660400} {"current_steps": 19415, "total_steps": 33920, "loss": 0.5552, "lr": 4.610371952024285e-06, "epoch": 11.44752358490566, "percentage": 57.24, "elapsed_time": "0:36:41", "remaining_time": "0:27:24", "throughput": 5753.29, "total_tokens": 12664944} {"current_steps": 19420, "total_steps": 33920, "loss": 0.2934, "lr": 4.607807112775485e-06, "epoch": 11.450471698113208, "percentage": 57.25, "elapsed_time": "0:36:41", "remaining_time": "0:27:24", "throughput": 5753.34, "total_tokens": 12668272} {"current_steps": 19425, "total_steps": 33920, "loss": 0.3197, "lr": 4.605242377361441e-06, "epoch": 11.453419811320755, "percentage": 57.27, "elapsed_time": "0:36:42", "remaining_time": "0:27:23", "throughput": 5753.58, "total_tokens": 12672272} {"current_steps": 19430, "total_steps": 33920, "loss": 0.3842, "lr": 4.60267774646118e-06, "epoch": 11.456367924528301, "percentage": 57.28, "elapsed_time": "0:36:43", "remaining_time": "0:27:22", "throughput": 5753.73, "total_tokens": 12675760} {"current_steps": 19435, "total_steps": 33920, "loss": 0.4433, "lr": 4.600113220753698e-06, "epoch": 11.45931603773585, "percentage": 57.3, "elapsed_time": "0:36:43", "remaining_time": "0:27:22", "throughput": 5753.68, "total_tokens": 12678896} {"current_steps": 19440, "total_steps": 33920, "loss": 0.387, "lr": 4.597548800917964e-06, "epoch": 11.462264150943396, "percentage": 57.31, "elapsed_time": "0:36:44", "remaining_time": "0:27:21", "throughput": 5753.73, "total_tokens": 12682256} {"current_steps": 19445, "total_steps": 33920, "loss": 0.4222, "lr": 4.594984487632919e-06, "epoch": 11.465212264150944, "percentage": 57.33, "elapsed_time": "0:36:44", "remaining_time": "0:27:21", "throughput": 5753.9, "total_tokens": 12686544} {"current_steps": 19450, "total_steps": 33920, "loss": 0.3709, "lr": 4.592420281577478e-06, "epoch": 11.46816037735849, "percentage": 57.34, "elapsed_time": "0:36:45", "remaining_time": "0:27:20", "throughput": 5753.91, "total_tokens": 12689520} {"current_steps": 19455, "total_steps": 33920, "loss": 0.3176, "lr": 4.589856183430521e-06, "epoch": 11.471108490566039, "percentage": 57.36, "elapsed_time": "0:36:45", "remaining_time": "0:27:20", "throughput": 5753.86, "total_tokens": 12692336} {"current_steps": 19460, "total_steps": 33920, "loss": 0.3825, "lr": 4.58729219387091e-06, "epoch": 11.474056603773585, "percentage": 57.37, "elapsed_time": "0:36:46", "remaining_time": "0:27:19", "throughput": 5754.15, "total_tokens": 12696784} {"current_steps": 19465, "total_steps": 33920, "loss": 0.2807, "lr": 4.584728313577468e-06, "epoch": 11.477004716981131, "percentage": 57.39, "elapsed_time": "0:36:47", "remaining_time": "0:27:19", "throughput": 5754.5, "total_tokens": 12701584} {"current_steps": 19470, "total_steps": 33920, "loss": 0.3338, "lr": 4.582164543228993e-06, "epoch": 11.47995283018868, "percentage": 57.4, "elapsed_time": "0:36:47", "remaining_time": "0:27:18", "throughput": 5754.41, "total_tokens": 12704624} {"current_steps": 19475, "total_steps": 33920, "loss": 0.3215, "lr": 4.5796008835042574e-06, "epoch": 11.482900943396226, "percentage": 57.41, "elapsed_time": "0:36:48", "remaining_time": "0:27:18", "throughput": 5754.55, "total_tokens": 12708368} {"current_steps": 19480, "total_steps": 33920, "loss": 0.4306, "lr": 4.577037335082e-06, "epoch": 11.485849056603774, "percentage": 57.43, "elapsed_time": "0:36:49", "remaining_time": "0:27:17", "throughput": 5754.77, "total_tokens": 12712304} {"current_steps": 19485, "total_steps": 33920, "loss": 0.437, "lr": 4.574473898640933e-06, "epoch": 11.48879716981132, "percentage": 57.44, "elapsed_time": "0:36:49", "remaining_time": "0:27:16", "throughput": 5754.75, "total_tokens": 12715600} {"current_steps": 19490, "total_steps": 33920, "loss": 0.358, "lr": 4.571910574859732e-06, "epoch": 11.491745283018869, "percentage": 57.46, "elapsed_time": "0:36:50", "remaining_time": "0:27:16", "throughput": 5754.54, "total_tokens": 12718192} {"current_steps": 19495, "total_steps": 33920, "loss": 0.3712, "lr": 4.5693473644170535e-06, "epoch": 11.494693396226415, "percentage": 57.47, "elapsed_time": "0:36:50", "remaining_time": "0:27:15", "throughput": 5754.89, "total_tokens": 12723344} {"current_steps": 19500, "total_steps": 33920, "loss": 0.395, "lr": 4.566784267991516e-06, "epoch": 11.497641509433961, "percentage": 57.49, "elapsed_time": "0:36:51", "remaining_time": "0:27:15", "throughput": 5754.91, "total_tokens": 12726480} {"current_steps": 19505, "total_steps": 33920, "loss": 0.4189, "lr": 4.564221286261709e-06, "epoch": 11.50058962264151, "percentage": 57.5, "elapsed_time": "0:36:52", "remaining_time": "0:27:14", "throughput": 5754.9, "total_tokens": 12729936} {"current_steps": 19510, "total_steps": 33920, "loss": 0.4949, "lr": 4.5616584199061964e-06, "epoch": 11.503537735849056, "percentage": 57.52, "elapsed_time": "0:36:52", "remaining_time": "0:27:14", "throughput": 5754.79, "total_tokens": 12732560} {"current_steps": 19515, "total_steps": 33920, "loss": 0.3673, "lr": 4.559095669603506e-06, "epoch": 11.506485849056604, "percentage": 57.53, "elapsed_time": "0:36:53", "remaining_time": "0:27:13", "throughput": 5754.95, "total_tokens": 12736592} {"current_steps": 19520, "total_steps": 33920, "loss": 0.2726, "lr": 4.556533036032136e-06, "epoch": 11.50943396226415, "percentage": 57.55, "elapsed_time": "0:36:53", "remaining_time": "0:27:13", "throughput": 5755.03, "total_tokens": 12739824} {"current_steps": 19525, "total_steps": 33920, "loss": 0.3249, "lr": 4.553970519870557e-06, "epoch": 11.512382075471699, "percentage": 57.56, "elapsed_time": "0:36:54", "remaining_time": "0:27:12", "throughput": 5754.98, "total_tokens": 12742864} {"current_steps": 19530, "total_steps": 33920, "loss": 0.3526, "lr": 4.551408121797205e-06, "epoch": 11.515330188679245, "percentage": 57.58, "elapsed_time": "0:36:54", "remaining_time": "0:27:11", "throughput": 5755.15, "total_tokens": 12746480} {"current_steps": 19535, "total_steps": 33920, "loss": 0.3497, "lr": 4.548845842490486e-06, "epoch": 11.518278301886792, "percentage": 57.59, "elapsed_time": "0:36:55", "remaining_time": "0:27:11", "throughput": 5754.96, "total_tokens": 12749104} {"current_steps": 19540, "total_steps": 33920, "loss": 0.2583, "lr": 4.5462836826287745e-06, "epoch": 11.52122641509434, "percentage": 57.61, "elapsed_time": "0:36:55", "remaining_time": "0:27:10", "throughput": 5755.26, "total_tokens": 12753360} {"current_steps": 19545, "total_steps": 33920, "loss": 0.3361, "lr": 4.543721642890414e-06, "epoch": 11.524174528301886, "percentage": 57.62, "elapsed_time": "0:36:56", "remaining_time": "0:27:10", "throughput": 5755.15, "total_tokens": 12756208} {"current_steps": 19550, "total_steps": 33920, "loss": 0.3636, "lr": 4.541159723953714e-06, "epoch": 11.527122641509434, "percentage": 57.64, "elapsed_time": "0:36:56", "remaining_time": "0:27:09", "throughput": 5755.14, "total_tokens": 12759120} {"current_steps": 19555, "total_steps": 33920, "loss": 0.3877, "lr": 4.538597926496955e-06, "epoch": 11.53007075471698, "percentage": 57.65, "elapsed_time": "0:36:57", "remaining_time": "0:27:08", "throughput": 5755.0, "total_tokens": 12761968} {"current_steps": 19560, "total_steps": 33920, "loss": 0.3654, "lr": 4.536036251198384e-06, "epoch": 11.533018867924529, "percentage": 57.67, "elapsed_time": "0:36:58", "remaining_time": "0:27:08", "throughput": 5755.06, "total_tokens": 12765232} {"current_steps": 19565, "total_steps": 33920, "loss": 0.3726, "lr": 4.5334746987362124e-06, "epoch": 11.535966981132075, "percentage": 57.68, "elapsed_time": "0:36:58", "remaining_time": "0:27:07", "throughput": 5755.25, "total_tokens": 12768976} {"current_steps": 19570, "total_steps": 33920, "loss": 0.3561, "lr": 4.530913269788627e-06, "epoch": 11.538915094339622, "percentage": 57.69, "elapsed_time": "0:36:59", "remaining_time": "0:27:07", "throughput": 5755.42, "total_tokens": 12772816} {"current_steps": 19575, "total_steps": 33920, "loss": 0.4169, "lr": 4.528351965033775e-06, "epoch": 11.54186320754717, "percentage": 57.71, "elapsed_time": "0:36:59", "remaining_time": "0:27:06", "throughput": 5755.71, "total_tokens": 12777488} {"current_steps": 19580, "total_steps": 33920, "loss": 0.3557, "lr": 4.525790785149774e-06, "epoch": 11.544811320754716, "percentage": 57.72, "elapsed_time": "0:37:00", "remaining_time": "0:27:06", "throughput": 5755.73, "total_tokens": 12781040} {"current_steps": 19585, "total_steps": 33920, "loss": 0.4655, "lr": 4.523229730814705e-06, "epoch": 11.547759433962264, "percentage": 57.74, "elapsed_time": "0:37:01", "remaining_time": "0:27:05", "throughput": 5755.59, "total_tokens": 12784080} {"current_steps": 19590, "total_steps": 33920, "loss": 0.2927, "lr": 4.52066880270662e-06, "epoch": 11.55070754716981, "percentage": 57.75, "elapsed_time": "0:37:01", "remaining_time": "0:27:05", "throughput": 5755.51, "total_tokens": 12786736} {"current_steps": 19595, "total_steps": 33920, "loss": 0.3374, "lr": 4.518108001503536e-06, "epoch": 11.553655660377359, "percentage": 57.77, "elapsed_time": "0:37:02", "remaining_time": "0:27:04", "throughput": 5755.56, "total_tokens": 12790000} {"current_steps": 19600, "total_steps": 33920, "loss": 0.3287, "lr": 4.515547327883434e-06, "epoch": 11.556603773584905, "percentage": 57.78, "elapsed_time": "0:37:02", "remaining_time": "0:27:03", "throughput": 5755.65, "total_tokens": 12793456} {"current_steps": 19605, "total_steps": 33920, "loss": 0.3315, "lr": 4.512986782524266e-06, "epoch": 11.559551886792454, "percentage": 57.8, "elapsed_time": "0:37:03", "remaining_time": "0:27:03", "throughput": 5755.78, "total_tokens": 12796784} {"current_steps": 19610, "total_steps": 33920, "loss": 0.253, "lr": 4.510426366103946e-06, "epoch": 11.5625, "percentage": 57.81, "elapsed_time": "0:37:03", "remaining_time": "0:27:02", "throughput": 5755.79, "total_tokens": 12799632} {"current_steps": 19615, "total_steps": 33920, "loss": 0.4082, "lr": 4.5078660793003544e-06, "epoch": 11.565448113207546, "percentage": 57.83, "elapsed_time": "0:37:04", "remaining_time": "0:27:02", "throughput": 5755.89, "total_tokens": 12802736} {"current_steps": 19620, "total_steps": 33920, "loss": 0.3562, "lr": 4.505305922791341e-06, "epoch": 11.568396226415095, "percentage": 57.84, "elapsed_time": "0:37:04", "remaining_time": "0:27:01", "throughput": 5756.0, "total_tokens": 12806384} {"current_steps": 19625, "total_steps": 33920, "loss": 0.3332, "lr": 4.502745897254716e-06, "epoch": 11.571344339622641, "percentage": 57.86, "elapsed_time": "0:37:05", "remaining_time": "0:27:01", "throughput": 5755.96, "total_tokens": 12809456} {"current_steps": 19630, "total_steps": 33920, "loss": 0.337, "lr": 4.500186003368257e-06, "epoch": 11.57429245283019, "percentage": 57.87, "elapsed_time": "0:37:05", "remaining_time": "0:27:00", "throughput": 5755.96, "total_tokens": 12812528} {"current_steps": 19635, "total_steps": 33920, "loss": 0.3819, "lr": 4.497626241809709e-06, "epoch": 11.577240566037736, "percentage": 57.89, "elapsed_time": "0:37:06", "remaining_time": "0:26:59", "throughput": 5756.05, "total_tokens": 12816048} {"current_steps": 19640, "total_steps": 33920, "loss": 0.2827, "lr": 4.4950666132567775e-06, "epoch": 11.580188679245284, "percentage": 57.9, "elapsed_time": "0:37:07", "remaining_time": "0:26:59", "throughput": 5755.98, "total_tokens": 12818992} {"current_steps": 19645, "total_steps": 33920, "loss": 0.4781, "lr": 4.492507118387136e-06, "epoch": 11.58313679245283, "percentage": 57.92, "elapsed_time": "0:37:07", "remaining_time": "0:26:58", "throughput": 5755.96, "total_tokens": 12822064} {"current_steps": 19650, "total_steps": 33920, "loss": 0.335, "lr": 4.4899477578784235e-06, "epoch": 11.586084905660378, "percentage": 57.93, "elapsed_time": "0:37:08", "remaining_time": "0:26:58", "throughput": 5756.17, "total_tokens": 12825904} {"current_steps": 19655, "total_steps": 33920, "loss": 0.2272, "lr": 4.487388532408239e-06, "epoch": 11.589033018867925, "percentage": 57.95, "elapsed_time": "0:37:08", "remaining_time": "0:26:57", "throughput": 5756.43, "total_tokens": 12830160} {"current_steps": 19660, "total_steps": 33920, "loss": 0.338, "lr": 4.48482944265415e-06, "epoch": 11.591981132075471, "percentage": 57.96, "elapsed_time": "0:37:09", "remaining_time": "0:26:57", "throughput": 5756.47, "total_tokens": 12833360} {"current_steps": 19665, "total_steps": 33920, "loss": 0.2952, "lr": 4.482270489293685e-06, "epoch": 11.59492924528302, "percentage": 57.97, "elapsed_time": "0:37:09", "remaining_time": "0:26:56", "throughput": 5756.43, "total_tokens": 12836208} {"current_steps": 19670, "total_steps": 33920, "loss": 0.3761, "lr": 4.479711673004341e-06, "epoch": 11.597877358490566, "percentage": 57.99, "elapsed_time": "0:37:10", "remaining_time": "0:26:55", "throughput": 5756.59, "total_tokens": 12839984} {"current_steps": 19675, "total_steps": 33920, "loss": 0.2245, "lr": 4.477152994463575e-06, "epoch": 11.600825471698114, "percentage": 58.0, "elapsed_time": "0:37:11", "remaining_time": "0:26:55", "throughput": 5756.54, "total_tokens": 12843088} {"current_steps": 19680, "total_steps": 33920, "loss": 0.3974, "lr": 4.474594454348805e-06, "epoch": 11.60377358490566, "percentage": 58.02, "elapsed_time": "0:37:11", "remaining_time": "0:26:54", "throughput": 5756.75, "total_tokens": 12846736} {"current_steps": 19685, "total_steps": 33920, "loss": 0.3732, "lr": 4.472036053337419e-06, "epoch": 11.606721698113208, "percentage": 58.03, "elapsed_time": "0:37:12", "remaining_time": "0:26:54", "throughput": 5756.56, "total_tokens": 12849200} {"current_steps": 19690, "total_steps": 33920, "loss": 0.358, "lr": 4.469477792106761e-06, "epoch": 11.609669811320755, "percentage": 58.05, "elapsed_time": "0:37:12", "remaining_time": "0:26:53", "throughput": 5756.54, "total_tokens": 12852080} {"current_steps": 19695, "total_steps": 33920, "loss": 0.3108, "lr": 4.466919671334146e-06, "epoch": 11.612617924528301, "percentage": 58.06, "elapsed_time": "0:37:13", "remaining_time": "0:26:52", "throughput": 5756.48, "total_tokens": 12854864} {"current_steps": 19700, "total_steps": 33920, "loss": 0.3447, "lr": 4.4643616916968456e-06, "epoch": 11.61556603773585, "percentage": 58.08, "elapsed_time": "0:37:13", "remaining_time": "0:26:52", "throughput": 5756.39, "total_tokens": 12857776} {"current_steps": 19705, "total_steps": 33920, "loss": 0.3862, "lr": 4.461803853872095e-06, "epoch": 11.618514150943396, "percentage": 58.09, "elapsed_time": "0:37:14", "remaining_time": "0:26:51", "throughput": 5756.56, "total_tokens": 12861360} {"current_steps": 19710, "total_steps": 33920, "loss": 0.2916, "lr": 4.459246158537094e-06, "epoch": 11.621462264150944, "percentage": 58.11, "elapsed_time": "0:37:14", "remaining_time": "0:26:51", "throughput": 5756.72, "total_tokens": 12864976} {"current_steps": 19715, "total_steps": 33920, "loss": 0.3191, "lr": 4.456688606369003e-06, "epoch": 11.62441037735849, "percentage": 58.12, "elapsed_time": "0:37:15", "remaining_time": "0:26:50", "throughput": 5756.56, "total_tokens": 12867856} {"current_steps": 19720, "total_steps": 33920, "loss": 0.251, "lr": 4.4541311980449446e-06, "epoch": 11.627358490566039, "percentage": 58.14, "elapsed_time": "0:37:16", "remaining_time": "0:26:50", "throughput": 5757.16, "total_tokens": 12876464} {"current_steps": 19725, "total_steps": 33920, "loss": 0.3129, "lr": 4.4515739342420045e-06, "epoch": 11.630306603773585, "percentage": 58.15, "elapsed_time": "0:37:17", "remaining_time": "0:26:49", "throughput": 5757.25, "total_tokens": 12879952} {"current_steps": 19730, "total_steps": 33920, "loss": 0.4182, "lr": 4.4490168156372294e-06, "epoch": 11.633254716981131, "percentage": 58.17, "elapsed_time": "0:37:17", "remaining_time": "0:26:49", "throughput": 5757.31, "total_tokens": 12883088} {"current_steps": 19735, "total_steps": 33920, "loss": 0.3258, "lr": 4.446459842907626e-06, "epoch": 11.63620283018868, "percentage": 58.18, "elapsed_time": "0:37:18", "remaining_time": "0:26:48", "throughput": 5757.11, "total_tokens": 12885840} {"current_steps": 19740, "total_steps": 33920, "loss": 0.3486, "lr": 4.443903016730165e-06, "epoch": 11.639150943396226, "percentage": 58.2, "elapsed_time": "0:37:18", "remaining_time": "0:26:48", "throughput": 5756.79, "total_tokens": 12888656} {"current_steps": 19745, "total_steps": 33920, "loss": 0.3017, "lr": 4.4413463377817775e-06, "epoch": 11.642099056603774, "percentage": 58.21, "elapsed_time": "0:37:19", "remaining_time": "0:26:47", "throughput": 5757.06, "total_tokens": 12892880} {"current_steps": 19750, "total_steps": 33920, "loss": 0.3611, "lr": 4.438789806739353e-06, "epoch": 11.64504716981132, "percentage": 58.23, "elapsed_time": "0:37:20", "remaining_time": "0:26:47", "throughput": 5756.95, "total_tokens": 12895792} {"current_steps": 19755, "total_steps": 33920, "loss": 0.3311, "lr": 4.436233424279746e-06, "epoch": 11.647995283018869, "percentage": 58.24, "elapsed_time": "0:37:20", "remaining_time": "0:26:46", "throughput": 5756.84, "total_tokens": 12898672} {"current_steps": 19760, "total_steps": 33920, "loss": 0.4604, "lr": 4.433677191079771e-06, "epoch": 11.650943396226415, "percentage": 58.25, "elapsed_time": "0:37:21", "remaining_time": "0:26:46", "throughput": 5756.82, "total_tokens": 12902576} {"current_steps": 19765, "total_steps": 33920, "loss": 0.3461, "lr": 4.431121107816201e-06, "epoch": 11.653891509433961, "percentage": 58.27, "elapsed_time": "0:37:21", "remaining_time": "0:26:45", "throughput": 5756.77, "total_tokens": 12905616} {"current_steps": 19770, "total_steps": 33920, "loss": 0.4085, "lr": 4.4285651751657676e-06, "epoch": 11.65683962264151, "percentage": 58.28, "elapsed_time": "0:37:22", "remaining_time": "0:26:44", "throughput": 5756.81, "total_tokens": 12908752} {"current_steps": 19775, "total_steps": 33920, "loss": 0.4832, "lr": 4.4260093938051685e-06, "epoch": 11.659787735849056, "percentage": 58.3, "elapsed_time": "0:37:22", "remaining_time": "0:26:44", "throughput": 5756.68, "total_tokens": 12911824} {"current_steps": 19780, "total_steps": 33920, "loss": 0.2572, "lr": 4.423453764411056e-06, "epoch": 11.662735849056604, "percentage": 58.31, "elapsed_time": "0:37:23", "remaining_time": "0:26:43", "throughput": 5756.7, "total_tokens": 12914992} {"current_steps": 19785, "total_steps": 33920, "loss": 0.3632, "lr": 4.4208982876600425e-06, "epoch": 11.66568396226415, "percentage": 58.33, "elapsed_time": "0:37:24", "remaining_time": "0:26:43", "throughput": 5756.52, "total_tokens": 12917744} {"current_steps": 19790, "total_steps": 33920, "loss": 0.4312, "lr": 4.418342964228705e-06, "epoch": 11.668632075471699, "percentage": 58.34, "elapsed_time": "0:37:24", "remaining_time": "0:26:42", "throughput": 5756.61, "total_tokens": 12921424} {"current_steps": 19795, "total_steps": 33920, "loss": 0.349, "lr": 4.415787794793574e-06, "epoch": 11.671580188679245, "percentage": 58.36, "elapsed_time": "0:37:25", "remaining_time": "0:26:42", "throughput": 5756.52, "total_tokens": 12924336} {"current_steps": 19800, "total_steps": 33920, "loss": 0.3619, "lr": 4.4132327800311414e-06, "epoch": 11.674528301886792, "percentage": 58.37, "elapsed_time": "0:37:25", "remaining_time": "0:26:41", "throughput": 5756.65, "total_tokens": 12927728} {"current_steps": 19805, "total_steps": 33920, "loss": 0.4579, "lr": 4.41067792061786e-06, "epoch": 11.67747641509434, "percentage": 58.39, "elapsed_time": "0:37:26", "remaining_time": "0:26:41", "throughput": 5756.93, "total_tokens": 12932336} {"current_steps": 19810, "total_steps": 33920, "loss": 0.324, "lr": 4.408123217230139e-06, "epoch": 11.680424528301886, "percentage": 58.4, "elapsed_time": "0:37:27", "remaining_time": "0:26:40", "throughput": 5757.15, "total_tokens": 12936688} {"current_steps": 19815, "total_steps": 33920, "loss": 0.3054, "lr": 4.4055686705443464e-06, "epoch": 11.683372641509434, "percentage": 58.42, "elapsed_time": "0:37:27", "remaining_time": "0:26:39", "throughput": 5756.87, "total_tokens": 12939120} {"current_steps": 19820, "total_steps": 33920, "loss": 0.5332, "lr": 4.4030142812368106e-06, "epoch": 11.68632075471698, "percentage": 58.43, "elapsed_time": "0:37:28", "remaining_time": "0:26:39", "throughput": 5756.72, "total_tokens": 12941712} {"current_steps": 19825, "total_steps": 33920, "loss": 0.3176, "lr": 4.400460049983817e-06, "epoch": 11.689268867924529, "percentage": 58.45, "elapsed_time": "0:37:28", "remaining_time": "0:26:38", "throughput": 5756.58, "total_tokens": 12944560} {"current_steps": 19830, "total_steps": 33920, "loss": 0.3162, "lr": 4.397905977461608e-06, "epoch": 11.692216981132075, "percentage": 58.46, "elapsed_time": "0:37:29", "remaining_time": "0:26:38", "throughput": 5756.56, "total_tokens": 12947792} {"current_steps": 19835, "total_steps": 33920, "loss": 0.381, "lr": 4.395352064346387e-06, "epoch": 11.695165094339622, "percentage": 58.48, "elapsed_time": "0:37:29", "remaining_time": "0:26:37", "throughput": 5756.61, "total_tokens": 12951184} {"current_steps": 19840, "total_steps": 33920, "loss": 0.3052, "lr": 4.392798311314314e-06, "epoch": 11.69811320754717, "percentage": 58.49, "elapsed_time": "0:37:30", "remaining_time": "0:26:36", "throughput": 5756.47, "total_tokens": 12953872} {"current_steps": 19845, "total_steps": 33920, "loss": 0.3202, "lr": 4.390244719041502e-06, "epoch": 11.701061320754716, "percentage": 58.51, "elapsed_time": "0:37:30", "remaining_time": "0:26:36", "throughput": 5756.42, "total_tokens": 12956848} {"current_steps": 19850, "total_steps": 33920, "loss": 0.3853, "lr": 4.387691288204029e-06, "epoch": 11.704009433962264, "percentage": 58.52, "elapsed_time": "0:37:31", "remaining_time": "0:26:35", "throughput": 5756.28, "total_tokens": 12959792} {"current_steps": 19855, "total_steps": 33920, "loss": 0.4453, "lr": 4.385138019477928e-06, "epoch": 11.70695754716981, "percentage": 58.53, "elapsed_time": "0:37:32", "remaining_time": "0:26:35", "throughput": 5756.45, "total_tokens": 12963728} {"current_steps": 19860, "total_steps": 33920, "loss": 0.3877, "lr": 4.3825849135391864e-06, "epoch": 11.709905660377359, "percentage": 58.55, "elapsed_time": "0:37:32", "remaining_time": "0:26:34", "throughput": 5756.53, "total_tokens": 12966928} {"current_steps": 19865, "total_steps": 33920, "loss": 0.3766, "lr": 4.380031971063748e-06, "epoch": 11.712853773584905, "percentage": 58.56, "elapsed_time": "0:37:33", "remaining_time": "0:26:34", "throughput": 5756.54, "total_tokens": 12970544} {"current_steps": 19870, "total_steps": 33920, "loss": 0.2545, "lr": 4.37747919272752e-06, "epoch": 11.715801886792454, "percentage": 58.58, "elapsed_time": "0:37:33", "remaining_time": "0:26:33", "throughput": 5756.57, "total_tokens": 12973904} {"current_steps": 19875, "total_steps": 33920, "loss": 0.3655, "lr": 4.374926579206357e-06, "epoch": 11.71875, "percentage": 58.59, "elapsed_time": "0:37:34", "remaining_time": "0:26:33", "throughput": 5756.63, "total_tokens": 12977232} {"current_steps": 19880, "total_steps": 33920, "loss": 0.3731, "lr": 4.372374131176075e-06, "epoch": 11.721698113207546, "percentage": 58.61, "elapsed_time": "0:37:34", "remaining_time": "0:26:32", "throughput": 5756.44, "total_tokens": 12980016} {"current_steps": 19885, "total_steps": 33920, "loss": 0.3131, "lr": 4.369821849312449e-06, "epoch": 11.724646226415095, "percentage": 58.62, "elapsed_time": "0:37:35", "remaining_time": "0:26:31", "throughput": 5756.22, "total_tokens": 12982736} {"current_steps": 19890, "total_steps": 33920, "loss": 0.3864, "lr": 4.367269734291203e-06, "epoch": 11.727594339622641, "percentage": 58.64, "elapsed_time": "0:37:36", "remaining_time": "0:26:31", "throughput": 5756.37, "total_tokens": 12986480} {"current_steps": 19895, "total_steps": 33920, "loss": 0.3393, "lr": 4.364717786788022e-06, "epoch": 11.73054245283019, "percentage": 58.65, "elapsed_time": "0:37:36", "remaining_time": "0:26:30", "throughput": 5756.28, "total_tokens": 12989296} {"current_steps": 19900, "total_steps": 33920, "loss": 0.304, "lr": 4.362166007478545e-06, "epoch": 11.733490566037736, "percentage": 58.67, "elapsed_time": "0:37:37", "remaining_time": "0:26:30", "throughput": 5756.47, "total_tokens": 12993008} {"current_steps": 19905, "total_steps": 33920, "loss": 0.3506, "lr": 4.3596143970383665e-06, "epoch": 11.736438679245284, "percentage": 58.68, "elapsed_time": "0:37:37", "remaining_time": "0:26:29", "throughput": 5756.6, "total_tokens": 12996528} {"current_steps": 19910, "total_steps": 33920, "loss": 0.2346, "lr": 4.357062956143035e-06, "epoch": 11.73938679245283, "percentage": 58.7, "elapsed_time": "0:37:38", "remaining_time": "0:26:29", "throughput": 5756.69, "total_tokens": 12999888} {"current_steps": 19915, "total_steps": 33920, "loss": 0.3916, "lr": 4.354511685468059e-06, "epoch": 11.742334905660378, "percentage": 58.71, "elapsed_time": "0:37:38", "remaining_time": "0:26:28", "throughput": 5756.77, "total_tokens": 13003216} {"current_steps": 19920, "total_steps": 33920, "loss": 0.4338, "lr": 4.351960585688894e-06, "epoch": 11.745283018867925, "percentage": 58.73, "elapsed_time": "0:37:39", "remaining_time": "0:26:27", "throughput": 5756.79, "total_tokens": 13006736} {"current_steps": 19925, "total_steps": 33920, "loss": 0.3118, "lr": 4.349409657480959e-06, "epoch": 11.748231132075471, "percentage": 58.74, "elapsed_time": "0:37:39", "remaining_time": "0:26:27", "throughput": 5756.81, "total_tokens": 13009680} {"current_steps": 19930, "total_steps": 33920, "loss": 0.2942, "lr": 4.34685890151962e-06, "epoch": 11.75117924528302, "percentage": 58.76, "elapsed_time": "0:37:40", "remaining_time": "0:26:26", "throughput": 5756.86, "total_tokens": 13013040} {"current_steps": 19935, "total_steps": 33920, "loss": 0.3928, "lr": 4.344308318480201e-06, "epoch": 11.754127358490566, "percentage": 58.77, "elapsed_time": "0:37:40", "remaining_time": "0:26:26", "throughput": 5756.69, "total_tokens": 13015504} {"current_steps": 19940, "total_steps": 33920, "loss": 0.434, "lr": 4.341757909037981e-06, "epoch": 11.757075471698114, "percentage": 58.79, "elapsed_time": "0:37:41", "remaining_time": "0:26:25", "throughput": 5756.88, "total_tokens": 13019152} {"current_steps": 19945, "total_steps": 33920, "loss": 0.3215, "lr": 4.33920767386819e-06, "epoch": 11.76002358490566, "percentage": 58.8, "elapsed_time": "0:37:42", "remaining_time": "0:26:24", "throughput": 5756.81, "total_tokens": 13022128} {"current_steps": 19950, "total_steps": 33920, "loss": 0.3521, "lr": 4.336657613646017e-06, "epoch": 11.762971698113208, "percentage": 58.81, "elapsed_time": "0:37:42", "remaining_time": "0:26:24", "throughput": 5756.75, "total_tokens": 13024784} {"current_steps": 19955, "total_steps": 33920, "loss": 0.2877, "lr": 4.3341077290466e-06, "epoch": 11.765919811320755, "percentage": 58.83, "elapsed_time": "0:37:43", "remaining_time": "0:26:23", "throughput": 5756.81, "total_tokens": 13028176} {"current_steps": 19960, "total_steps": 33920, "loss": 0.3249, "lr": 4.331558020745031e-06, "epoch": 11.768867924528301, "percentage": 58.84, "elapsed_time": "0:37:43", "remaining_time": "0:26:23", "throughput": 5756.93, "total_tokens": 13032272} {"current_steps": 19965, "total_steps": 33920, "loss": 0.3644, "lr": 4.329008489416357e-06, "epoch": 11.77181603773585, "percentage": 58.86, "elapsed_time": "0:37:44", "remaining_time": "0:26:22", "throughput": 5756.79, "total_tokens": 13034832} {"current_steps": 19970, "total_steps": 33920, "loss": 0.4821, "lr": 4.326459135735576e-06, "epoch": 11.774764150943396, "percentage": 58.87, "elapsed_time": "0:37:44", "remaining_time": "0:26:22", "throughput": 5756.57, "total_tokens": 13037200} {"current_steps": 19975, "total_steps": 33920, "loss": 0.2726, "lr": 4.323909960377644e-06, "epoch": 11.777712264150944, "percentage": 58.89, "elapsed_time": "0:37:45", "remaining_time": "0:26:21", "throughput": 5756.86, "total_tokens": 13041680} {"current_steps": 19980, "total_steps": 33920, "loss": 0.3055, "lr": 4.3213609640174625e-06, "epoch": 11.78066037735849, "percentage": 58.9, "elapsed_time": "0:37:45", "remaining_time": "0:26:20", "throughput": 5756.76, "total_tokens": 13044528} {"current_steps": 19985, "total_steps": 33920, "loss": 0.4243, "lr": 4.318812147329889e-06, "epoch": 11.783608490566039, "percentage": 58.92, "elapsed_time": "0:37:46", "remaining_time": "0:26:20", "throughput": 5756.7, "total_tokens": 13047248} {"current_steps": 19990, "total_steps": 33920, "loss": 0.3191, "lr": 4.316263510989737e-06, "epoch": 11.786556603773585, "percentage": 58.93, "elapsed_time": "0:37:47", "remaining_time": "0:26:19", "throughput": 5756.78, "total_tokens": 13050928} {"current_steps": 19995, "total_steps": 33920, "loss": 0.4503, "lr": 4.313715055671768e-06, "epoch": 11.789504716981131, "percentage": 58.95, "elapsed_time": "0:37:47", "remaining_time": "0:26:19", "throughput": 5756.68, "total_tokens": 13053616} {"current_steps": 20000, "total_steps": 33920, "loss": 0.3559, "lr": 4.311166782050694e-06, "epoch": 11.79245283018868, "percentage": 58.96, "elapsed_time": "0:37:48", "remaining_time": "0:26:18", "throughput": 5756.64, "total_tokens": 13056400} {"current_steps": 20005, "total_steps": 33920, "loss": 0.3114, "lr": 4.308618690801184e-06, "epoch": 11.795400943396226, "percentage": 58.98, "elapsed_time": "0:37:48", "remaining_time": "0:26:17", "throughput": 5756.58, "total_tokens": 13059184} {"current_steps": 20010, "total_steps": 33920, "loss": 0.2989, "lr": 4.3060707825978564e-06, "epoch": 11.798349056603774, "percentage": 58.99, "elapsed_time": "0:37:49", "remaining_time": "0:26:17", "throughput": 5756.7, "total_tokens": 13062576} {"current_steps": 20015, "total_steps": 33920, "loss": 0.2936, "lr": 4.303523058115278e-06, "epoch": 11.80129716981132, "percentage": 59.01, "elapsed_time": "0:37:49", "remaining_time": "0:26:16", "throughput": 5756.66, "total_tokens": 13065712} {"current_steps": 20020, "total_steps": 33920, "loss": 0.4175, "lr": 4.300975518027972e-06, "epoch": 11.804245283018869, "percentage": 59.02, "elapsed_time": "0:37:50", "remaining_time": "0:26:16", "throughput": 5756.72, "total_tokens": 13068848} {"current_steps": 20025, "total_steps": 33920, "loss": 0.4302, "lr": 4.298428163010411e-06, "epoch": 11.807193396226415, "percentage": 59.04, "elapsed_time": "0:37:50", "remaining_time": "0:26:15", "throughput": 5756.44, "total_tokens": 13071408} {"current_steps": 20030, "total_steps": 33920, "loss": 0.3091, "lr": 4.295880993737016e-06, "epoch": 11.810141509433961, "percentage": 59.05, "elapsed_time": "0:37:51", "remaining_time": "0:26:15", "throughput": 5756.41, "total_tokens": 13074736} {"current_steps": 20035, "total_steps": 33920, "loss": 0.2936, "lr": 4.293334010882164e-06, "epoch": 11.81308962264151, "percentage": 59.07, "elapsed_time": "0:37:51", "remaining_time": "0:26:14", "throughput": 5756.22, "total_tokens": 13077168} {"current_steps": 20040, "total_steps": 33920, "loss": 0.3821, "lr": 4.290787215120178e-06, "epoch": 11.816037735849056, "percentage": 59.08, "elapsed_time": "0:37:52", "remaining_time": "0:26:13", "throughput": 5756.26, "total_tokens": 13080656} {"current_steps": 20045, "total_steps": 33920, "loss": 0.3946, "lr": 4.2882406071253315e-06, "epoch": 11.818985849056604, "percentage": 59.09, "elapsed_time": "0:37:53", "remaining_time": "0:26:13", "throughput": 5756.42, "total_tokens": 13084496} {"current_steps": 20050, "total_steps": 33920, "loss": 0.326, "lr": 4.285694187571852e-06, "epoch": 11.82193396226415, "percentage": 59.11, "elapsed_time": "0:37:53", "remaining_time": "0:26:12", "throughput": 5756.16, "total_tokens": 13086864} {"current_steps": 20055, "total_steps": 33920, "loss": 0.3551, "lr": 4.283147957133917e-06, "epoch": 11.824882075471699, "percentage": 59.12, "elapsed_time": "0:37:54", "remaining_time": "0:26:12", "throughput": 5756.21, "total_tokens": 13090256} {"current_steps": 20060, "total_steps": 33920, "loss": 0.5957, "lr": 4.280601916485648e-06, "epoch": 11.827830188679245, "percentage": 59.14, "elapsed_time": "0:37:54", "remaining_time": "0:26:11", "throughput": 5756.49, "total_tokens": 13094544} {"current_steps": 20065, "total_steps": 33920, "loss": 0.373, "lr": 4.278056066301123e-06, "epoch": 11.830778301886792, "percentage": 59.15, "elapsed_time": "0:37:55", "remaining_time": "0:26:11", "throughput": 5756.6, "total_tokens": 13098096} {"current_steps": 20070, "total_steps": 33920, "loss": 0.3699, "lr": 4.275510407254366e-06, "epoch": 11.83372641509434, "percentage": 59.17, "elapsed_time": "0:37:55", "remaining_time": "0:26:10", "throughput": 5756.72, "total_tokens": 13101648} {"current_steps": 20075, "total_steps": 33920, "loss": 0.5472, "lr": 4.27296494001935e-06, "epoch": 11.836674528301886, "percentage": 59.18, "elapsed_time": "0:37:56", "remaining_time": "0:26:09", "throughput": 5756.43, "total_tokens": 13103760} {"current_steps": 20080, "total_steps": 33920, "loss": 0.3275, "lr": 4.2704196652700005e-06, "epoch": 11.839622641509434, "percentage": 59.2, "elapsed_time": "0:37:56", "remaining_time": "0:26:09", "throughput": 5756.28, "total_tokens": 13106256} {"current_steps": 20085, "total_steps": 33920, "loss": 0.3523, "lr": 4.2678745836801895e-06, "epoch": 11.84257075471698, "percentage": 59.21, "elapsed_time": "0:37:57", "remaining_time": "0:26:08", "throughput": 5756.13, "total_tokens": 13109072} {"current_steps": 20090, "total_steps": 33920, "loss": 0.3538, "lr": 4.265329695923736e-06, "epoch": 11.845518867924529, "percentage": 59.23, "elapsed_time": "0:37:57", "remaining_time": "0:26:08", "throughput": 5755.79, "total_tokens": 13111312} {"current_steps": 20095, "total_steps": 33920, "loss": 0.3267, "lr": 4.262785002674412e-06, "epoch": 11.848466981132075, "percentage": 59.24, "elapsed_time": "0:37:58", "remaining_time": "0:26:07", "throughput": 5755.93, "total_tokens": 13115408} {"current_steps": 20100, "total_steps": 33920, "loss": 0.347, "lr": 4.260240504605938e-06, "epoch": 11.851415094339622, "percentage": 59.26, "elapsed_time": "0:37:59", "remaining_time": "0:26:07", "throughput": 5755.75, "total_tokens": 13117968} {"current_steps": 20105, "total_steps": 33920, "loss": 0.3731, "lr": 4.2576962023919775e-06, "epoch": 11.85436320754717, "percentage": 59.27, "elapsed_time": "0:37:59", "remaining_time": "0:26:06", "throughput": 5755.9, "total_tokens": 13121680} {"current_steps": 20110, "total_steps": 33920, "loss": 0.3094, "lr": 4.255152096706145e-06, "epoch": 11.857311320754716, "percentage": 59.29, "elapsed_time": "0:38:00", "remaining_time": "0:26:05", "throughput": 5755.76, "total_tokens": 13124336} {"current_steps": 20115, "total_steps": 33920, "loss": 0.2977, "lr": 4.252608188222007e-06, "epoch": 11.860259433962264, "percentage": 59.3, "elapsed_time": "0:38:00", "remaining_time": "0:26:05", "throughput": 5755.92, "total_tokens": 13128240} {"current_steps": 20120, "total_steps": 33920, "loss": 0.3837, "lr": 4.250064477613071e-06, "epoch": 11.86320754716981, "percentage": 59.32, "elapsed_time": "0:38:01", "remaining_time": "0:26:04", "throughput": 5755.67, "total_tokens": 13130928} {"current_steps": 20125, "total_steps": 33920, "loss": 0.3878, "lr": 4.247520965552797e-06, "epoch": 11.866155660377359, "percentage": 59.33, "elapsed_time": "0:38:01", "remaining_time": "0:26:04", "throughput": 5755.4, "total_tokens": 13133360} {"current_steps": 20130, "total_steps": 33920, "loss": 0.3664, "lr": 4.24497765271459e-06, "epoch": 11.869103773584905, "percentage": 59.35, "elapsed_time": "0:38:02", "remaining_time": "0:26:03", "throughput": 5755.05, "total_tokens": 13135760} {"current_steps": 20135, "total_steps": 33920, "loss": 0.23, "lr": 4.242434539771804e-06, "epoch": 11.872051886792454, "percentage": 59.36, "elapsed_time": "0:38:03", "remaining_time": "0:26:03", "throughput": 5754.95, "total_tokens": 13138736} {"current_steps": 20140, "total_steps": 33920, "loss": 0.3659, "lr": 4.239891627397737e-06, "epoch": 11.875, "percentage": 59.38, "elapsed_time": "0:38:03", "remaining_time": "0:26:02", "throughput": 5755.08, "total_tokens": 13142320} {"current_steps": 20145, "total_steps": 33920, "loss": 0.314, "lr": 4.237348916265638e-06, "epoch": 11.877948113207546, "percentage": 59.39, "elapsed_time": "0:38:04", "remaining_time": "0:26:01", "throughput": 5755.13, "total_tokens": 13145424} {"current_steps": 20150, "total_steps": 33920, "loss": 0.3222, "lr": 4.234806407048702e-06, "epoch": 11.880896226415095, "percentage": 59.4, "elapsed_time": "0:38:04", "remaining_time": "0:26:01", "throughput": 5754.95, "total_tokens": 13148272} {"current_steps": 20155, "total_steps": 33920, "loss": 0.3203, "lr": 4.232264100420066e-06, "epoch": 11.883844339622641, "percentage": 59.42, "elapsed_time": "0:38:05", "remaining_time": "0:26:00", "throughput": 5755.29, "total_tokens": 13152944} {"current_steps": 20160, "total_steps": 33920, "loss": 0.3395, "lr": 4.229721997052819e-06, "epoch": 11.88679245283019, "percentage": 59.43, "elapsed_time": "0:38:06", "remaining_time": "0:26:00", "throughput": 5755.41, "total_tokens": 13157200} {"current_steps": 20165, "total_steps": 33920, "loss": 0.2976, "lr": 4.227180097619993e-06, "epoch": 11.889740566037736, "percentage": 59.45, "elapsed_time": "0:38:06", "remaining_time": "0:25:59", "throughput": 5755.31, "total_tokens": 13160080} {"current_steps": 20170, "total_steps": 33920, "loss": 0.3071, "lr": 4.224638402794566e-06, "epoch": 11.892688679245284, "percentage": 59.46, "elapsed_time": "0:38:07", "remaining_time": "0:25:59", "throughput": 5755.35, "total_tokens": 13163088} {"current_steps": 20175, "total_steps": 33920, "loss": 0.3437, "lr": 4.222096913249464e-06, "epoch": 11.89563679245283, "percentage": 59.48, "elapsed_time": "0:38:07", "remaining_time": "0:25:58", "throughput": 5755.55, "total_tokens": 13167440} {"current_steps": 20180, "total_steps": 33920, "loss": 0.3684, "lr": 4.219555629657558e-06, "epoch": 11.898584905660378, "percentage": 59.49, "elapsed_time": "0:38:08", "remaining_time": "0:25:58", "throughput": 5755.33, "total_tokens": 13170256} {"current_steps": 20185, "total_steps": 33920, "loss": 0.1981, "lr": 4.21701455269166e-06, "epoch": 11.901533018867925, "percentage": 59.51, "elapsed_time": "0:38:09", "remaining_time": "0:25:57", "throughput": 5755.57, "total_tokens": 13175504} {"current_steps": 20190, "total_steps": 33920, "loss": 0.3874, "lr": 4.2144736830245356e-06, "epoch": 11.904481132075471, "percentage": 59.52, "elapsed_time": "0:38:09", "remaining_time": "0:25:57", "throughput": 5755.63, "total_tokens": 13178768} {"current_steps": 20195, "total_steps": 33920, "loss": 0.2877, "lr": 4.211933021328889e-06, "epoch": 11.90742924528302, "percentage": 59.54, "elapsed_time": "0:38:10", "remaining_time": "0:25:56", "throughput": 5755.52, "total_tokens": 13181456} {"current_steps": 20200, "total_steps": 33920, "loss": 0.432, "lr": 4.20939256827737e-06, "epoch": 11.910377358490566, "percentage": 59.55, "elapsed_time": "0:38:10", "remaining_time": "0:25:55", "throughput": 5755.65, "total_tokens": 13185008} {"current_steps": 20205, "total_steps": 33920, "loss": 0.3265, "lr": 4.206852324542578e-06, "epoch": 11.913325471698114, "percentage": 59.57, "elapsed_time": "0:38:11", "remaining_time": "0:25:55", "throughput": 5755.77, "total_tokens": 13188976} {"current_steps": 20210, "total_steps": 33920, "loss": 0.3963, "lr": 4.2043122907970496e-06, "epoch": 11.91627358490566, "percentage": 59.58, "elapsed_time": "0:38:11", "remaining_time": "0:25:54", "throughput": 5755.81, "total_tokens": 13191856} {"current_steps": 20215, "total_steps": 33920, "loss": 0.3803, "lr": 4.2017724677132715e-06, "epoch": 11.919221698113208, "percentage": 59.6, "elapsed_time": "0:38:12", "remaining_time": "0:25:54", "throughput": 5755.75, "total_tokens": 13194800} {"current_steps": 20220, "total_steps": 33920, "loss": 0.4519, "lr": 4.1992328559636734e-06, "epoch": 11.922169811320755, "percentage": 59.61, "elapsed_time": "0:38:12", "remaining_time": "0:25:53", "throughput": 5755.5, "total_tokens": 13197328} {"current_steps": 20225, "total_steps": 33920, "loss": 0.3107, "lr": 4.196693456220628e-06, "epoch": 11.925117924528301, "percentage": 59.63, "elapsed_time": "0:38:13", "remaining_time": "0:25:53", "throughput": 5755.75, "total_tokens": 13201104} {"current_steps": 20230, "total_steps": 33920, "loss": 0.3754, "lr": 4.194154269156452e-06, "epoch": 11.92806603773585, "percentage": 59.64, "elapsed_time": "0:38:14", "remaining_time": "0:25:52", "throughput": 5755.86, "total_tokens": 13204624} {"current_steps": 20235, "total_steps": 33920, "loss": 0.4644, "lr": 4.191615295443404e-06, "epoch": 11.931014150943396, "percentage": 59.66, "elapsed_time": "0:38:14", "remaining_time": "0:25:51", "throughput": 5755.76, "total_tokens": 13207312} {"current_steps": 20240, "total_steps": 33920, "loss": 0.2378, "lr": 4.189076535753692e-06, "epoch": 11.933962264150944, "percentage": 59.67, "elapsed_time": "0:38:15", "remaining_time": "0:25:51", "throughput": 5755.95, "total_tokens": 13211184} {"current_steps": 20245, "total_steps": 33920, "loss": 0.3686, "lr": 4.186537990759464e-06, "epoch": 11.93691037735849, "percentage": 59.68, "elapsed_time": "0:38:15", "remaining_time": "0:25:50", "throughput": 5755.92, "total_tokens": 13214064} {"current_steps": 20250, "total_steps": 33920, "loss": 0.4844, "lr": 4.183999661132806e-06, "epoch": 11.939858490566039, "percentage": 59.7, "elapsed_time": "0:38:16", "remaining_time": "0:25:50", "throughput": 5755.97, "total_tokens": 13217136} {"current_steps": 20255, "total_steps": 33920, "loss": 0.2784, "lr": 4.181461547545756e-06, "epoch": 11.942806603773585, "percentage": 59.71, "elapsed_time": "0:38:16", "remaining_time": "0:25:49", "throughput": 5755.93, "total_tokens": 13220176} {"current_steps": 20260, "total_steps": 33920, "loss": 0.369, "lr": 4.178923650670289e-06, "epoch": 11.945754716981131, "percentage": 59.73, "elapsed_time": "0:38:17", "remaining_time": "0:25:48", "throughput": 5755.71, "total_tokens": 13222608} {"current_steps": 20265, "total_steps": 33920, "loss": 0.4154, "lr": 4.176385971178324e-06, "epoch": 11.94870283018868, "percentage": 59.74, "elapsed_time": "0:38:17", "remaining_time": "0:25:48", "throughput": 5755.78, "total_tokens": 13225904} {"current_steps": 20270, "total_steps": 33920, "loss": 0.376, "lr": 4.1738485097417225e-06, "epoch": 11.951650943396226, "percentage": 59.76, "elapsed_time": "0:38:18", "remaining_time": "0:25:47", "throughput": 5755.8, "total_tokens": 13229136} {"current_steps": 20275, "total_steps": 33920, "loss": 0.3338, "lr": 4.1713112670322886e-06, "epoch": 11.954599056603774, "percentage": 59.77, "elapsed_time": "0:38:18", "remaining_time": "0:25:47", "throughput": 5755.7, "total_tokens": 13231792} {"current_steps": 20280, "total_steps": 33920, "loss": 0.3771, "lr": 4.168774243721768e-06, "epoch": 11.95754716981132, "percentage": 59.79, "elapsed_time": "0:38:19", "remaining_time": "0:25:46", "throughput": 5755.99, "total_tokens": 13238160} {"current_steps": 20285, "total_steps": 33920, "loss": 0.3378, "lr": 4.166237440481849e-06, "epoch": 11.960495283018869, "percentage": 59.8, "elapsed_time": "0:38:20", "remaining_time": "0:25:46", "throughput": 5756.21, "total_tokens": 13242448} {"current_steps": 20290, "total_steps": 33920, "loss": 0.3214, "lr": 4.163700857984162e-06, "epoch": 11.963443396226415, "percentage": 59.82, "elapsed_time": "0:38:21", "remaining_time": "0:25:45", "throughput": 5756.27, "total_tokens": 13245648} {"current_steps": 20295, "total_steps": 33920, "loss": 0.5059, "lr": 4.161164496900275e-06, "epoch": 11.966391509433961, "percentage": 59.83, "elapsed_time": "0:38:21", "remaining_time": "0:25:45", "throughput": 5756.31, "total_tokens": 13248752} {"current_steps": 20300, "total_steps": 33920, "loss": 0.3935, "lr": 4.1586283579017036e-06, "epoch": 11.96933962264151, "percentage": 59.85, "elapsed_time": "0:38:22", "remaining_time": "0:25:44", "throughput": 5756.23, "total_tokens": 13251536} {"current_steps": 20305, "total_steps": 33920, "loss": 0.2989, "lr": 4.156092441659901e-06, "epoch": 11.972287735849056, "percentage": 59.86, "elapsed_time": "0:38:22", "remaining_time": "0:25:44", "throughput": 5756.19, "total_tokens": 13254672} {"current_steps": 20310, "total_steps": 33920, "loss": 0.3406, "lr": 4.153556748846261e-06, "epoch": 11.975235849056604, "percentage": 59.88, "elapsed_time": "0:38:23", "remaining_time": "0:25:43", "throughput": 5756.11, "total_tokens": 13257680} {"current_steps": 20315, "total_steps": 33920, "loss": 0.2483, "lr": 4.15102128013212e-06, "epoch": 11.97818396226415, "percentage": 59.89, "elapsed_time": "0:38:23", "remaining_time": "0:25:42", "throughput": 5755.99, "total_tokens": 13260656} {"current_steps": 20320, "total_steps": 33920, "loss": 0.3695, "lr": 4.1484860361887544e-06, "epoch": 11.981132075471699, "percentage": 59.91, "elapsed_time": "0:38:24", "remaining_time": "0:25:42", "throughput": 5756.08, "total_tokens": 13263888} {"current_steps": 20325, "total_steps": 33920, "loss": 0.4148, "lr": 4.145951017687379e-06, "epoch": 11.984080188679245, "percentage": 59.92, "elapsed_time": "0:38:24", "remaining_time": "0:25:41", "throughput": 5755.98, "total_tokens": 13266640} {"current_steps": 20330, "total_steps": 33920, "loss": 0.4365, "lr": 4.1434162252991524e-06, "epoch": 11.987028301886792, "percentage": 59.94, "elapsed_time": "0:38:25", "remaining_time": "0:25:41", "throughput": 5755.97, "total_tokens": 13270096} {"current_steps": 20335, "total_steps": 33920, "loss": 0.3419, "lr": 4.140881659695173e-06, "epoch": 11.98997641509434, "percentage": 59.95, "elapsed_time": "0:38:25", "remaining_time": "0:25:40", "throughput": 5755.99, "total_tokens": 13273200} {"current_steps": 20340, "total_steps": 33920, "loss": 0.4011, "lr": 4.138347321546477e-06, "epoch": 11.992924528301886, "percentage": 59.96, "elapsed_time": "0:38:26", "remaining_time": "0:25:39", "throughput": 5756.09, "total_tokens": 13276400} {"current_steps": 20345, "total_steps": 33920, "loss": 0.3915, "lr": 4.13581321152404e-06, "epoch": 11.995872641509434, "percentage": 59.98, "elapsed_time": "0:38:27", "remaining_time": "0:25:39", "throughput": 5755.81, "total_tokens": 13278704} {"current_steps": 20350, "total_steps": 33920, "loss": 0.4077, "lr": 4.133279330298781e-06, "epoch": 11.99882075471698, "percentage": 59.99, "elapsed_time": "0:38:27", "remaining_time": "0:25:38", "throughput": 5755.52, "total_tokens": 13281168} {"current_steps": 20352, "total_steps": 33920, "eval_loss": 0.5487748980522156, "epoch": 12.0, "percentage": 60.0, "elapsed_time": "0:38:47", "remaining_time": "0:25:51", "throughput": 5707.03, "total_tokens": 13281912} {"current_steps": 20355, "total_steps": 33920, "loss": 0.353, "lr": 4.130745678541555e-06, "epoch": 12.001768867924529, "percentage": 60.01, "elapsed_time": "0:38:51", "remaining_time": "0:25:53", "throughput": 5698.32, "total_tokens": 13283864} {"current_steps": 20360, "total_steps": 33920, "loss": 0.3585, "lr": 4.128212256923155e-06, "epoch": 12.004716981132075, "percentage": 60.02, "elapsed_time": "0:38:51", "remaining_time": "0:25:53", "throughput": 5698.57, "total_tokens": 13288760} {"current_steps": 20365, "total_steps": 33920, "loss": 0.3218, "lr": 4.125679066114318e-06, "epoch": 12.007665094339623, "percentage": 60.04, "elapsed_time": "0:38:52", "remaining_time": "0:25:52", "throughput": 5698.57, "total_tokens": 13291704} {"current_steps": 20370, "total_steps": 33920, "loss": 0.4386, "lr": 4.123146106785717e-06, "epoch": 12.01061320754717, "percentage": 60.05, "elapsed_time": "0:38:53", "remaining_time": "0:25:52", "throughput": 5698.85, "total_tokens": 13296344} {"current_steps": 20375, "total_steps": 33920, "loss": 0.3174, "lr": 4.1206133796079625e-06, "epoch": 12.013561320754716, "percentage": 60.07, "elapsed_time": "0:38:53", "remaining_time": "0:25:51", "throughput": 5699.08, "total_tokens": 13300216} {"current_steps": 20380, "total_steps": 33920, "loss": 0.3052, "lr": 4.1180808852516065e-06, "epoch": 12.016509433962264, "percentage": 60.08, "elapsed_time": "0:38:54", "remaining_time": "0:25:50", "throughput": 5699.25, "total_tokens": 13303832} {"current_steps": 20385, "total_steps": 33920, "loss": 0.3133, "lr": 4.115548624387136e-06, "epoch": 12.01945754716981, "percentage": 60.1, "elapsed_time": "0:38:54", "remaining_time": "0:25:50", "throughput": 5699.15, "total_tokens": 13306424} {"current_steps": 20390, "total_steps": 33920, "loss": 0.3835, "lr": 4.113016597684979e-06, "epoch": 12.022405660377359, "percentage": 60.11, "elapsed_time": "0:38:55", "remaining_time": "0:25:49", "throughput": 5699.23, "total_tokens": 13309752} {"current_steps": 20395, "total_steps": 33920, "loss": 0.2298, "lr": 4.110484805815502e-06, "epoch": 12.025353773584905, "percentage": 60.13, "elapsed_time": "0:38:55", "remaining_time": "0:25:49", "throughput": 5699.34, "total_tokens": 13313528} {"current_steps": 20400, "total_steps": 33920, "loss": 0.3466, "lr": 4.107953249449005e-06, "epoch": 12.028301886792454, "percentage": 60.14, "elapsed_time": "0:38:56", "remaining_time": "0:25:48", "throughput": 5699.45, "total_tokens": 13317304} {"current_steps": 20405, "total_steps": 33920, "loss": 0.3609, "lr": 4.105421929255729e-06, "epoch": 12.03125, "percentage": 60.16, "elapsed_time": "0:38:57", "remaining_time": "0:25:47", "throughput": 5699.56, "total_tokens": 13320536} {"current_steps": 20410, "total_steps": 33920, "loss": 0.382, "lr": 4.102890845905854e-06, "epoch": 12.034198113207546, "percentage": 60.17, "elapsed_time": "0:38:57", "remaining_time": "0:25:47", "throughput": 5699.71, "total_tokens": 13323896} {"current_steps": 20415, "total_steps": 33920, "loss": 0.2472, "lr": 4.1003600000694935e-06, "epoch": 12.037146226415095, "percentage": 60.19, "elapsed_time": "0:38:58", "remaining_time": "0:25:46", "throughput": 5699.96, "total_tokens": 13328152} {"current_steps": 20420, "total_steps": 33920, "loss": 0.2954, "lr": 4.0978293924167e-06, "epoch": 12.040094339622641, "percentage": 60.2, "elapsed_time": "0:38:58", "remaining_time": "0:25:46", "throughput": 5700.06, "total_tokens": 13331448} {"current_steps": 20425, "total_steps": 33920, "loss": 0.2799, "lr": 4.095299023617461e-06, "epoch": 12.04304245283019, "percentage": 60.22, "elapsed_time": "0:38:59", "remaining_time": "0:25:45", "throughput": 5700.23, "total_tokens": 13335736} {"current_steps": 20430, "total_steps": 33920, "loss": 0.3648, "lr": 4.092768894341707e-06, "epoch": 12.045990566037736, "percentage": 60.23, "elapsed_time": "0:39:00", "remaining_time": "0:25:45", "throughput": 5700.29, "total_tokens": 13338776} {"current_steps": 20435, "total_steps": 33920, "loss": 0.3692, "lr": 4.090239005259298e-06, "epoch": 12.048938679245284, "percentage": 60.24, "elapsed_time": "0:39:00", "remaining_time": "0:25:44", "throughput": 5700.17, "total_tokens": 13341656} {"current_steps": 20440, "total_steps": 33920, "loss": 0.4255, "lr": 4.087709357040033e-06, "epoch": 12.05188679245283, "percentage": 60.26, "elapsed_time": "0:39:01", "remaining_time": "0:25:43", "throughput": 5700.12, "total_tokens": 13344376} {"current_steps": 20445, "total_steps": 33920, "loss": 0.415, "lr": 4.085179950353648e-06, "epoch": 12.054834905660377, "percentage": 60.27, "elapsed_time": "0:39:01", "remaining_time": "0:25:43", "throughput": 5700.42, "total_tokens": 13349592} {"current_steps": 20450, "total_steps": 33920, "loss": 0.348, "lr": 4.0826507858698135e-06, "epoch": 12.057783018867925, "percentage": 60.29, "elapsed_time": "0:39:02", "remaining_time": "0:25:42", "throughput": 5700.51, "total_tokens": 13352632} {"current_steps": 20455, "total_steps": 33920, "loss": 0.4618, "lr": 4.080121864258136e-06, "epoch": 12.060731132075471, "percentage": 60.3, "elapsed_time": "0:39:02", "remaining_time": "0:25:42", "throughput": 5700.67, "total_tokens": 13356184} {"current_steps": 20460, "total_steps": 33920, "loss": 0.2893, "lr": 4.077593186188161e-06, "epoch": 12.06367924528302, "percentage": 60.32, "elapsed_time": "0:39:03", "remaining_time": "0:25:41", "throughput": 5700.77, "total_tokens": 13359448} {"current_steps": 20465, "total_steps": 33920, "loss": 0.4575, "lr": 4.075064752329364e-06, "epoch": 12.066627358490566, "percentage": 60.33, "elapsed_time": "0:39:03", "remaining_time": "0:25:41", "throughput": 5700.72, "total_tokens": 13362136} {"current_steps": 20470, "total_steps": 33920, "loss": 0.3701, "lr": 4.0725365633511605e-06, "epoch": 12.069575471698114, "percentage": 60.35, "elapsed_time": "0:39:04", "remaining_time": "0:25:40", "throughput": 5700.62, "total_tokens": 13364952} {"current_steps": 20475, "total_steps": 33920, "loss": 0.4149, "lr": 4.070008619922899e-06, "epoch": 12.07252358490566, "percentage": 60.36, "elapsed_time": "0:39:05", "remaining_time": "0:25:39", "throughput": 5700.75, "total_tokens": 13368504} {"current_steps": 20480, "total_steps": 33920, "loss": 0.4641, "lr": 4.067480922713864e-06, "epoch": 12.075471698113208, "percentage": 60.38, "elapsed_time": "0:39:05", "remaining_time": "0:25:39", "throughput": 5700.85, "total_tokens": 13371704} {"current_steps": 20485, "total_steps": 33920, "loss": 0.359, "lr": 4.064953472393273e-06, "epoch": 12.078419811320755, "percentage": 60.39, "elapsed_time": "0:39:06", "remaining_time": "0:25:38", "throughput": 5700.91, "total_tokens": 13374904} {"current_steps": 20490, "total_steps": 33920, "loss": 0.3922, "lr": 4.06242626963028e-06, "epoch": 12.081367924528301, "percentage": 60.41, "elapsed_time": "0:39:06", "remaining_time": "0:25:38", "throughput": 5701.02, "total_tokens": 13378296} {"current_steps": 20495, "total_steps": 33920, "loss": 0.2894, "lr": 4.059899315093972e-06, "epoch": 12.08431603773585, "percentage": 60.42, "elapsed_time": "0:39:07", "remaining_time": "0:25:37", "throughput": 5700.83, "total_tokens": 13380696} {"current_steps": 20500, "total_steps": 33920, "loss": 0.2079, "lr": 4.057372609453374e-06, "epoch": 12.087264150943396, "percentage": 60.44, "elapsed_time": "0:39:07", "remaining_time": "0:25:36", "throughput": 5700.76, "total_tokens": 13383512} {"current_steps": 20505, "total_steps": 33920, "loss": 0.2893, "lr": 4.054846153377439e-06, "epoch": 12.090212264150944, "percentage": 60.45, "elapsed_time": "0:39:08", "remaining_time": "0:25:36", "throughput": 5700.66, "total_tokens": 13386072} {"current_steps": 20510, "total_steps": 33920, "loss": 0.328, "lr": 4.052319947535058e-06, "epoch": 12.09316037735849, "percentage": 60.47, "elapsed_time": "0:39:08", "remaining_time": "0:25:35", "throughput": 5700.8, "total_tokens": 13389496} {"current_steps": 20515, "total_steps": 33920, "loss": 0.2193, "lr": 4.049793992595056e-06, "epoch": 12.096108490566039, "percentage": 60.48, "elapsed_time": "0:39:09", "remaining_time": "0:25:35", "throughput": 5700.87, "total_tokens": 13392824} {"current_steps": 20520, "total_steps": 33920, "loss": 0.434, "lr": 4.047268289226187e-06, "epoch": 12.099056603773585, "percentage": 60.5, "elapsed_time": "0:39:09", "remaining_time": "0:25:34", "throughput": 5700.89, "total_tokens": 13396248} {"current_steps": 20525, "total_steps": 33920, "loss": 0.3271, "lr": 4.044742838097147e-06, "epoch": 12.102004716981131, "percentage": 60.51, "elapsed_time": "0:39:10", "remaining_time": "0:25:34", "throughput": 5701.12, "total_tokens": 13400696} {"current_steps": 20530, "total_steps": 33920, "loss": 0.3603, "lr": 4.0422176398765564e-06, "epoch": 12.10495283018868, "percentage": 60.52, "elapsed_time": "0:39:11", "remaining_time": "0:25:33", "throughput": 5701.04, "total_tokens": 13403416} {"current_steps": 20535, "total_steps": 33920, "loss": 0.3258, "lr": 4.039692695232975e-06, "epoch": 12.107900943396226, "percentage": 60.54, "elapsed_time": "0:39:11", "remaining_time": "0:25:32", "throughput": 5700.93, "total_tokens": 13406232} {"current_steps": 20540, "total_steps": 33920, "loss": 0.4166, "lr": 4.03716800483489e-06, "epoch": 12.110849056603774, "percentage": 60.55, "elapsed_time": "0:39:12", "remaining_time": "0:25:32", "throughput": 5700.93, "total_tokens": 13409592} {"current_steps": 20545, "total_steps": 33920, "loss": 0.4068, "lr": 4.034643569350726e-06, "epoch": 12.11379716981132, "percentage": 60.57, "elapsed_time": "0:39:12", "remaining_time": "0:25:31", "throughput": 5700.93, "total_tokens": 13412600} {"current_steps": 20550, "total_steps": 33920, "loss": 0.3674, "lr": 4.032119389448837e-06, "epoch": 12.116745283018869, "percentage": 60.58, "elapsed_time": "0:39:13", "remaining_time": "0:25:31", "throughput": 5701.02, "total_tokens": 13415704} {"current_steps": 20555, "total_steps": 33920, "loss": 0.3078, "lr": 4.0295954657975115e-06, "epoch": 12.119693396226415, "percentage": 60.6, "elapsed_time": "0:39:13", "remaining_time": "0:25:30", "throughput": 5701.0, "total_tokens": 13418488} {"current_steps": 20560, "total_steps": 33920, "loss": 0.4106, "lr": 4.027071799064968e-06, "epoch": 12.122641509433961, "percentage": 60.61, "elapsed_time": "0:39:14", "remaining_time": "0:25:29", "throughput": 5701.23, "total_tokens": 13422328} {"current_steps": 20565, "total_steps": 33920, "loss": 0.4722, "lr": 4.02454838991936e-06, "epoch": 12.12558962264151, "percentage": 60.63, "elapsed_time": "0:39:14", "remaining_time": "0:25:29", "throughput": 5701.29, "total_tokens": 13425624} {"current_steps": 20570, "total_steps": 33920, "loss": 0.4135, "lr": 4.022025239028768e-06, "epoch": 12.128537735849056, "percentage": 60.64, "elapsed_time": "0:39:15", "remaining_time": "0:25:28", "throughput": 5701.25, "total_tokens": 13428760} {"current_steps": 20575, "total_steps": 33920, "loss": 0.3318, "lr": 4.0195023470612095e-06, "epoch": 12.131485849056604, "percentage": 60.66, "elapsed_time": "0:39:15", "remaining_time": "0:25:28", "throughput": 5701.0, "total_tokens": 13431224} {"current_steps": 20580, "total_steps": 33920, "loss": 0.3496, "lr": 4.016979714684631e-06, "epoch": 12.13443396226415, "percentage": 60.67, "elapsed_time": "0:39:16", "remaining_time": "0:25:27", "throughput": 5700.72, "total_tokens": 13433464} {"current_steps": 20585, "total_steps": 33920, "loss": 0.3823, "lr": 4.014457342566909e-06, "epoch": 12.137382075471699, "percentage": 60.69, "elapsed_time": "0:39:16", "remaining_time": "0:25:26", "throughput": 5700.72, "total_tokens": 13436280} {"current_steps": 20590, "total_steps": 33920, "loss": 0.2917, "lr": 4.011935231375853e-06, "epoch": 12.140330188679245, "percentage": 60.7, "elapsed_time": "0:39:17", "remaining_time": "0:25:26", "throughput": 5700.56, "total_tokens": 13438808} {"current_steps": 20595, "total_steps": 33920, "loss": 0.4555, "lr": 4.009413381779203e-06, "epoch": 12.143278301886792, "percentage": 60.72, "elapsed_time": "0:39:17", "remaining_time": "0:25:25", "throughput": 5700.48, "total_tokens": 13441592} {"current_steps": 20600, "total_steps": 33920, "loss": 0.3184, "lr": 4.00689179444463e-06, "epoch": 12.14622641509434, "percentage": 60.73, "elapsed_time": "0:39:18", "remaining_time": "0:25:25", "throughput": 5700.47, "total_tokens": 13444728} {"current_steps": 20605, "total_steps": 33920, "loss": 0.335, "lr": 4.004370470039733e-06, "epoch": 12.149174528301886, "percentage": 60.75, "elapsed_time": "0:39:19", "remaining_time": "0:25:24", "throughput": 5700.58, "total_tokens": 13448280} {"current_steps": 20610, "total_steps": 33920, "loss": 0.3919, "lr": 4.001849409232046e-06, "epoch": 12.152122641509434, "percentage": 60.76, "elapsed_time": "0:39:19", "remaining_time": "0:25:23", "throughput": 5700.62, "total_tokens": 13451256} {"current_steps": 20615, "total_steps": 33920, "loss": 0.2797, "lr": 3.9993286126890274e-06, "epoch": 12.15507075471698, "percentage": 60.78, "elapsed_time": "0:39:20", "remaining_time": "0:25:23", "throughput": 5700.6, "total_tokens": 13454232} {"current_steps": 20620, "total_steps": 33920, "loss": 0.3011, "lr": 3.996808081078074e-06, "epoch": 12.158018867924529, "percentage": 60.79, "elapsed_time": "0:39:20", "remaining_time": "0:25:22", "throughput": 5700.6, "total_tokens": 13457464} {"current_steps": 20625, "total_steps": 33920, "loss": 0.2561, "lr": 3.9942878150665035e-06, "epoch": 12.160966981132075, "percentage": 60.8, "elapsed_time": "0:39:21", "remaining_time": "0:25:22", "throughput": 5700.62, "total_tokens": 13460728} {"current_steps": 20630, "total_steps": 33920, "loss": 0.3655, "lr": 3.991767815321569e-06, "epoch": 12.163915094339623, "percentage": 60.82, "elapsed_time": "0:39:21", "remaining_time": "0:25:21", "throughput": 5700.72, "total_tokens": 13464280} {"current_steps": 20635, "total_steps": 33920, "loss": 0.4409, "lr": 3.9892480825104504e-06, "epoch": 12.16686320754717, "percentage": 60.83, "elapsed_time": "0:39:22", "remaining_time": "0:25:20", "throughput": 5700.77, "total_tokens": 13467640} {"current_steps": 20640, "total_steps": 33920, "loss": 0.3553, "lr": 3.986728617300257e-06, "epoch": 12.169811320754716, "percentage": 60.85, "elapsed_time": "0:39:22", "remaining_time": "0:25:20", "throughput": 5700.74, "total_tokens": 13470424} {"current_steps": 20645, "total_steps": 33920, "loss": 0.3627, "lr": 3.984209420358031e-06, "epoch": 12.172759433962264, "percentage": 60.86, "elapsed_time": "0:39:23", "remaining_time": "0:25:19", "throughput": 5700.67, "total_tokens": 13473240} {"current_steps": 20650, "total_steps": 33920, "loss": 0.4265, "lr": 3.981690492350738e-06, "epoch": 12.17570754716981, "percentage": 60.88, "elapsed_time": "0:39:24", "remaining_time": "0:25:19", "throughput": 5700.65, "total_tokens": 13476984} {"current_steps": 20655, "total_steps": 33920, "loss": 0.3657, "lr": 3.979171833945276e-06, "epoch": 12.178655660377359, "percentage": 60.89, "elapsed_time": "0:39:24", "remaining_time": "0:25:18", "throughput": 5700.8, "total_tokens": 13480632} {"current_steps": 20660, "total_steps": 33920, "loss": 0.4206, "lr": 3.97665344580847e-06, "epoch": 12.181603773584905, "percentage": 60.91, "elapsed_time": "0:39:25", "remaining_time": "0:25:18", "throughput": 5700.92, "total_tokens": 13484696} {"current_steps": 20665, "total_steps": 33920, "loss": 0.2996, "lr": 3.974135328607075e-06, "epoch": 12.184551886792454, "percentage": 60.92, "elapsed_time": "0:39:25", "remaining_time": "0:25:17", "throughput": 5700.84, "total_tokens": 13488056} {"current_steps": 20670, "total_steps": 33920, "loss": 0.3679, "lr": 3.971617483007773e-06, "epoch": 12.1875, "percentage": 60.94, "elapsed_time": "0:39:26", "remaining_time": "0:25:17", "throughput": 5700.91, "total_tokens": 13491576} {"current_steps": 20675, "total_steps": 33920, "loss": 0.3933, "lr": 3.969099909677174e-06, "epoch": 12.190448113207546, "percentage": 60.95, "elapsed_time": "0:39:27", "remaining_time": "0:25:16", "throughput": 5700.67, "total_tokens": 13493816} {"current_steps": 20680, "total_steps": 33920, "loss": 0.2716, "lr": 3.9665826092818165e-06, "epoch": 12.193396226415095, "percentage": 60.97, "elapsed_time": "0:39:27", "remaining_time": "0:25:15", "throughput": 5700.6, "total_tokens": 13496600} {"current_steps": 20685, "total_steps": 33920, "loss": 0.3145, "lr": 3.964065582488168e-06, "epoch": 12.196344339622641, "percentage": 60.98, "elapsed_time": "0:39:28", "remaining_time": "0:25:15", "throughput": 5700.61, "total_tokens": 13499608} {"current_steps": 20690, "total_steps": 33920, "loss": 0.3863, "lr": 3.961548829962622e-06, "epoch": 12.19929245283019, "percentage": 61.0, "elapsed_time": "0:39:28", "remaining_time": "0:25:14", "throughput": 5700.64, "total_tokens": 13502712} {"current_steps": 20695, "total_steps": 33920, "loss": 0.3898, "lr": 3.959032352371496e-06, "epoch": 12.202240566037736, "percentage": 61.01, "elapsed_time": "0:39:29", "remaining_time": "0:25:14", "throughput": 5700.64, "total_tokens": 13505848} {"current_steps": 20700, "total_steps": 33920, "loss": 0.3046, "lr": 3.956516150381043e-06, "epoch": 12.205188679245284, "percentage": 61.03, "elapsed_time": "0:39:29", "remaining_time": "0:25:13", "throughput": 5700.48, "total_tokens": 13508344} {"current_steps": 20705, "total_steps": 33920, "loss": 0.3733, "lr": 3.954000224657436e-06, "epoch": 12.20813679245283, "percentage": 61.04, "elapsed_time": "0:39:30", "remaining_time": "0:25:12", "throughput": 5700.19, "total_tokens": 13510840} {"current_steps": 20710, "total_steps": 33920, "loss": 0.2855, "lr": 3.951484575866776e-06, "epoch": 12.211084905660377, "percentage": 61.06, "elapsed_time": "0:39:30", "remaining_time": "0:25:12", "throughput": 5700.27, "total_tokens": 13514072} {"current_steps": 20715, "total_steps": 33920, "loss": 0.3604, "lr": 3.948969204675096e-06, "epoch": 12.214033018867925, "percentage": 61.07, "elapsed_time": "0:39:31", "remaining_time": "0:25:11", "throughput": 5700.15, "total_tokens": 13516856} {"current_steps": 20720, "total_steps": 33920, "loss": 0.3176, "lr": 3.946454111748346e-06, "epoch": 12.216981132075471, "percentage": 61.08, "elapsed_time": "0:39:31", "remaining_time": "0:25:11", "throughput": 5700.41, "total_tokens": 13521144} {"current_steps": 20725, "total_steps": 33920, "loss": 0.3252, "lr": 3.943939297752413e-06, "epoch": 12.21992924528302, "percentage": 61.1, "elapsed_time": "0:39:32", "remaining_time": "0:25:10", "throughput": 5700.71, "total_tokens": 13525336} {"current_steps": 20730, "total_steps": 33920, "loss": 0.4091, "lr": 3.9414247633531e-06, "epoch": 12.222877358490566, "percentage": 61.11, "elapsed_time": "0:39:33", "remaining_time": "0:25:09", "throughput": 5700.62, "total_tokens": 13528312} {"current_steps": 20735, "total_steps": 33920, "loss": 0.3953, "lr": 3.9389105092161454e-06, "epoch": 12.225825471698114, "percentage": 61.13, "elapsed_time": "0:39:33", "remaining_time": "0:25:09", "throughput": 5700.25, "total_tokens": 13530616} {"current_steps": 20740, "total_steps": 33920, "loss": 0.3276, "lr": 3.936396536007205e-06, "epoch": 12.22877358490566, "percentage": 61.14, "elapsed_time": "0:39:34", "remaining_time": "0:25:08", "throughput": 5700.41, "total_tokens": 13534328} {"current_steps": 20745, "total_steps": 33920, "loss": 0.3409, "lr": 3.933882844391866e-06, "epoch": 12.231721698113208, "percentage": 61.16, "elapsed_time": "0:39:34", "remaining_time": "0:25:08", "throughput": 5700.4, "total_tokens": 13537336} {"current_steps": 20750, "total_steps": 33920, "loss": 0.294, "lr": 3.931369435035639e-06, "epoch": 12.234669811320755, "percentage": 61.17, "elapsed_time": "0:39:35", "remaining_time": "0:25:07", "throughput": 5700.22, "total_tokens": 13539800} {"current_steps": 20755, "total_steps": 33920, "loss": 0.3727, "lr": 3.92885630860396e-06, "epoch": 12.237617924528301, "percentage": 61.19, "elapsed_time": "0:39:35", "remaining_time": "0:25:07", "throughput": 5700.19, "total_tokens": 13542680} {"current_steps": 20760, "total_steps": 33920, "loss": 0.392, "lr": 3.926343465762189e-06, "epoch": 12.24056603773585, "percentage": 61.2, "elapsed_time": "0:39:36", "remaining_time": "0:25:06", "throughput": 5699.9, "total_tokens": 13545080} {"current_steps": 20765, "total_steps": 33920, "loss": 0.3523, "lr": 3.923830907175613e-06, "epoch": 12.243514150943396, "percentage": 61.22, "elapsed_time": "0:39:36", "remaining_time": "0:25:05", "throughput": 5700.07, "total_tokens": 13548984} {"current_steps": 20770, "total_steps": 33920, "loss": 0.2164, "lr": 3.921318633509442e-06, "epoch": 12.246462264150944, "percentage": 61.23, "elapsed_time": "0:39:37", "remaining_time": "0:25:05", "throughput": 5700.12, "total_tokens": 13552312} {"current_steps": 20775, "total_steps": 33920, "loss": 0.3877, "lr": 3.918806645428811e-06, "epoch": 12.24941037735849, "percentage": 61.25, "elapsed_time": "0:39:38", "remaining_time": "0:25:04", "throughput": 5700.39, "total_tokens": 13556600} {"current_steps": 20780, "total_steps": 33920, "loss": 0.4143, "lr": 3.916294943598781e-06, "epoch": 12.252358490566039, "percentage": 61.26, "elapsed_time": "0:39:38", "remaining_time": "0:25:04", "throughput": 5700.36, "total_tokens": 13559448} {"current_steps": 20785, "total_steps": 33920, "loss": 0.4822, "lr": 3.913783528684336e-06, "epoch": 12.255306603773585, "percentage": 61.28, "elapsed_time": "0:39:39", "remaining_time": "0:25:03", "throughput": 5700.42, "total_tokens": 13562936} {"current_steps": 20790, "total_steps": 33920, "loss": 0.3081, "lr": 3.911272401350381e-06, "epoch": 12.258254716981131, "percentage": 61.29, "elapsed_time": "0:39:39", "remaining_time": "0:25:03", "throughput": 5700.49, "total_tokens": 13566328} {"current_steps": 20795, "total_steps": 33920, "loss": 0.3079, "lr": 3.9087615622617525e-06, "epoch": 12.26120283018868, "percentage": 61.31, "elapsed_time": "0:39:40", "remaining_time": "0:25:02", "throughput": 5700.54, "total_tokens": 13569592} {"current_steps": 20800, "total_steps": 33920, "loss": 0.3767, "lr": 3.906251012083202e-06, "epoch": 12.264150943396226, "percentage": 61.32, "elapsed_time": "0:39:40", "remaining_time": "0:25:01", "throughput": 5700.58, "total_tokens": 13572760} {"current_steps": 20805, "total_steps": 33920, "loss": 0.353, "lr": 3.9037407514794085e-06, "epoch": 12.267099056603774, "percentage": 61.34, "elapsed_time": "0:39:41", "remaining_time": "0:25:01", "throughput": 5700.58, "total_tokens": 13576184} {"current_steps": 20810, "total_steps": 33920, "loss": 0.4948, "lr": 3.901230781114976e-06, "epoch": 12.27004716981132, "percentage": 61.35, "elapsed_time": "0:39:42", "remaining_time": "0:25:00", "throughput": 5700.58, "total_tokens": 13579512} {"current_steps": 20815, "total_steps": 33920, "loss": 0.3364, "lr": 3.898721101654431e-06, "epoch": 12.272995283018869, "percentage": 61.36, "elapsed_time": "0:39:42", "remaining_time": "0:25:00", "throughput": 5700.64, "total_tokens": 13582680} {"current_steps": 20820, "total_steps": 33920, "loss": 0.3751, "lr": 3.896211713762221e-06, "epoch": 12.275943396226415, "percentage": 61.38, "elapsed_time": "0:39:43", "remaining_time": "0:24:59", "throughput": 5700.7, "total_tokens": 13585976} {"current_steps": 20825, "total_steps": 33920, "loss": 0.4929, "lr": 3.893702618102715e-06, "epoch": 12.278891509433961, "percentage": 61.39, "elapsed_time": "0:39:43", "remaining_time": "0:24:58", "throughput": 5700.62, "total_tokens": 13588728} {"current_steps": 20830, "total_steps": 33920, "loss": 0.3092, "lr": 3.891193815340211e-06, "epoch": 12.28183962264151, "percentage": 61.41, "elapsed_time": "0:39:44", "remaining_time": "0:24:58", "throughput": 5700.41, "total_tokens": 13591512} {"current_steps": 20835, "total_steps": 33920, "loss": 0.4348, "lr": 3.888685306138922e-06, "epoch": 12.284787735849056, "percentage": 61.42, "elapsed_time": "0:39:44", "remaining_time": "0:24:57", "throughput": 5700.61, "total_tokens": 13595352} {"current_steps": 20840, "total_steps": 33920, "loss": 0.3387, "lr": 3.886177091162987e-06, "epoch": 12.287735849056604, "percentage": 61.44, "elapsed_time": "0:39:45", "remaining_time": "0:24:57", "throughput": 5700.75, "total_tokens": 13599064} {"current_steps": 20845, "total_steps": 33920, "loss": 0.2732, "lr": 3.883669171076468e-06, "epoch": 12.29068396226415, "percentage": 61.45, "elapsed_time": "0:39:46", "remaining_time": "0:24:56", "throughput": 5700.78, "total_tokens": 13602296} {"current_steps": 20850, "total_steps": 33920, "loss": 0.3853, "lr": 3.881161546543348e-06, "epoch": 12.293632075471699, "percentage": 61.47, "elapsed_time": "0:39:46", "remaining_time": "0:24:56", "throughput": 5700.84, "total_tokens": 13605720} {"current_steps": 20855, "total_steps": 33920, "loss": 0.4167, "lr": 3.8786542182275295e-06, "epoch": 12.296580188679245, "percentage": 61.48, "elapsed_time": "0:39:47", "remaining_time": "0:24:55", "throughput": 5700.8, "total_tokens": 13608664} {"current_steps": 20860, "total_steps": 33920, "loss": 0.409, "lr": 3.87614718679284e-06, "epoch": 12.299528301886792, "percentage": 61.5, "elapsed_time": "0:39:47", "remaining_time": "0:24:54", "throughput": 5700.9, "total_tokens": 13611992} {"current_steps": 20865, "total_steps": 33920, "loss": 0.4036, "lr": 3.8736404529030255e-06, "epoch": 12.30247641509434, "percentage": 61.51, "elapsed_time": "0:39:48", "remaining_time": "0:24:54", "throughput": 5701.15, "total_tokens": 13616184} {"current_steps": 20870, "total_steps": 33920, "loss": 0.3698, "lr": 3.871134017221756e-06, "epoch": 12.305424528301886, "percentage": 61.53, "elapsed_time": "0:39:48", "remaining_time": "0:24:53", "throughput": 5701.11, "total_tokens": 13619096} {"current_steps": 20875, "total_steps": 33920, "loss": 0.481, "lr": 3.868627880412621e-06, "epoch": 12.308372641509434, "percentage": 61.54, "elapsed_time": "0:39:49", "remaining_time": "0:24:53", "throughput": 5701.12, "total_tokens": 13622008} {"current_steps": 20880, "total_steps": 33920, "loss": 0.277, "lr": 3.86612204313913e-06, "epoch": 12.31132075471698, "percentage": 61.56, "elapsed_time": "0:39:49", "remaining_time": "0:24:52", "throughput": 5701.34, "total_tokens": 13625976} {"current_steps": 20885, "total_steps": 33920, "loss": 0.3385, "lr": 3.863616506064714e-06, "epoch": 12.314268867924529, "percentage": 61.57, "elapsed_time": "0:39:50", "remaining_time": "0:24:51", "throughput": 5701.39, "total_tokens": 13629272} {"current_steps": 20890, "total_steps": 33920, "loss": 0.2594, "lr": 3.861111269852727e-06, "epoch": 12.317216981132075, "percentage": 61.59, "elapsed_time": "0:39:51", "remaining_time": "0:24:51", "throughput": 5701.4, "total_tokens": 13632376} {"current_steps": 20895, "total_steps": 33920, "loss": 0.337, "lr": 3.858606335166439e-06, "epoch": 12.320165094339623, "percentage": 61.6, "elapsed_time": "0:39:51", "remaining_time": "0:24:50", "throughput": 5701.46, "total_tokens": 13635352} {"current_steps": 20900, "total_steps": 33920, "loss": 0.3032, "lr": 3.8561017026690415e-06, "epoch": 12.32311320754717, "percentage": 61.62, "elapsed_time": "0:39:52", "remaining_time": "0:24:50", "throughput": 5701.45, "total_tokens": 13638456} {"current_steps": 20905, "total_steps": 33920, "loss": 0.3073, "lr": 3.8535973730236495e-06, "epoch": 12.326061320754716, "percentage": 61.63, "elapsed_time": "0:39:52", "remaining_time": "0:24:49", "throughput": 5701.28, "total_tokens": 13640856} {"current_steps": 20910, "total_steps": 33920, "loss": 0.3552, "lr": 3.851093346893294e-06, "epoch": 12.329009433962264, "percentage": 61.65, "elapsed_time": "0:39:53", "remaining_time": "0:24:49", "throughput": 5701.24, "total_tokens": 13644152} {"current_steps": 20915, "total_steps": 33920, "loss": 0.3963, "lr": 3.848589624940927e-06, "epoch": 12.33195754716981, "percentage": 61.66, "elapsed_time": "0:39:53", "remaining_time": "0:24:48", "throughput": 5701.29, "total_tokens": 13647320} {"current_steps": 20920, "total_steps": 33920, "loss": 0.3738, "lr": 3.846086207829417e-06, "epoch": 12.334905660377359, "percentage": 61.67, "elapsed_time": "0:39:54", "remaining_time": "0:24:47", "throughput": 5701.27, "total_tokens": 13650328} {"current_steps": 20925, "total_steps": 33920, "loss": 0.4254, "lr": 3.843583096221559e-06, "epoch": 12.337853773584905, "percentage": 61.69, "elapsed_time": "0:39:54", "remaining_time": "0:24:47", "throughput": 5701.34, "total_tokens": 13653688} {"current_steps": 20930, "total_steps": 33920, "loss": 0.4677, "lr": 3.8410802907800596e-06, "epoch": 12.340801886792454, "percentage": 61.7, "elapsed_time": "0:39:55", "remaining_time": "0:24:46", "throughput": 5701.28, "total_tokens": 13657048} {"current_steps": 20935, "total_steps": 33920, "loss": 0.4233, "lr": 3.838577792167546e-06, "epoch": 12.34375, "percentage": 61.72, "elapsed_time": "0:39:56", "remaining_time": "0:24:46", "throughput": 5701.43, "total_tokens": 13660920} {"current_steps": 20940, "total_steps": 33920, "loss": 0.395, "lr": 3.836075601046569e-06, "epoch": 12.346698113207546, "percentage": 61.73, "elapsed_time": "0:39:56", "remaining_time": "0:24:45", "throughput": 5701.42, "total_tokens": 13663896} {"current_steps": 20945, "total_steps": 33920, "loss": 0.4834, "lr": 3.833573718079594e-06, "epoch": 12.349646226415095, "percentage": 61.75, "elapsed_time": "0:39:57", "remaining_time": "0:24:44", "throughput": 5701.55, "total_tokens": 13667192} {"current_steps": 20950, "total_steps": 33920, "loss": 0.3511, "lr": 3.831072143929002e-06, "epoch": 12.352594339622641, "percentage": 61.76, "elapsed_time": "0:39:57", "remaining_time": "0:24:44", "throughput": 5701.53, "total_tokens": 13669976} {"current_steps": 20955, "total_steps": 33920, "loss": 0.4502, "lr": 3.828570879257098e-06, "epoch": 12.35554245283019, "percentage": 61.78, "elapsed_time": "0:39:58", "remaining_time": "0:24:43", "throughput": 5701.45, "total_tokens": 13672728} {"current_steps": 20960, "total_steps": 33920, "loss": 0.3107, "lr": 3.826069924726102e-06, "epoch": 12.358490566037736, "percentage": 61.79, "elapsed_time": "0:39:58", "remaining_time": "0:24:43", "throughput": 5701.5, "total_tokens": 13676056} {"current_steps": 20965, "total_steps": 33920, "loss": 0.4432, "lr": 3.823569280998154e-06, "epoch": 12.361438679245284, "percentage": 61.81, "elapsed_time": "0:39:59", "remaining_time": "0:24:42", "throughput": 5701.38, "total_tokens": 13679032} {"current_steps": 20970, "total_steps": 33920, "loss": 0.3114, "lr": 3.8210689487353095e-06, "epoch": 12.36438679245283, "percentage": 61.82, "elapsed_time": "0:39:59", "remaining_time": "0:24:41", "throughput": 5701.34, "total_tokens": 13682040} {"current_steps": 20975, "total_steps": 33920, "loss": 0.371, "lr": 3.818568928599539e-06, "epoch": 12.367334905660377, "percentage": 61.84, "elapsed_time": "0:40:00", "remaining_time": "0:24:41", "throughput": 5701.24, "total_tokens": 13684984} {"current_steps": 20980, "total_steps": 33920, "loss": 0.2964, "lr": 3.816069221252739e-06, "epoch": 12.370283018867925, "percentage": 61.85, "elapsed_time": "0:40:00", "remaining_time": "0:24:40", "throughput": 5701.14, "total_tokens": 13687832} {"current_steps": 20985, "total_steps": 33920, "loss": 0.2916, "lr": 3.813569827356715e-06, "epoch": 12.373231132075471, "percentage": 61.87, "elapsed_time": "0:40:01", "remaining_time": "0:24:40", "throughput": 5701.35, "total_tokens": 13692472} {"current_steps": 20990, "total_steps": 33920, "loss": 0.2198, "lr": 3.811070747573191e-06, "epoch": 12.37617924528302, "percentage": 61.88, "elapsed_time": "0:40:02", "remaining_time": "0:24:40", "throughput": 5701.54, "total_tokens": 13698392} {"current_steps": 20995, "total_steps": 33920, "loss": 0.302, "lr": 3.8085719825638098e-06, "epoch": 12.379127358490566, "percentage": 61.9, "elapsed_time": "0:40:03", "remaining_time": "0:24:39", "throughput": 5701.66, "total_tokens": 13702424} {"current_steps": 21000, "total_steps": 33920, "loss": 0.3146, "lr": 3.806073532990132e-06, "epoch": 12.382075471698114, "percentage": 61.91, "elapsed_time": "0:40:03", "remaining_time": "0:24:38", "throughput": 5701.56, "total_tokens": 13705240} {"current_steps": 21005, "total_steps": 33920, "loss": 0.3507, "lr": 3.8035753995136333e-06, "epoch": 12.38502358490566, "percentage": 61.93, "elapsed_time": "0:40:04", "remaining_time": "0:24:38", "throughput": 5701.66, "total_tokens": 13708664} {"current_steps": 21010, "total_steps": 33920, "loss": 0.2927, "lr": 3.801077582795702e-06, "epoch": 12.387971698113208, "percentage": 61.94, "elapsed_time": "0:40:04", "remaining_time": "0:24:37", "throughput": 5701.7, "total_tokens": 13711992} {"current_steps": 21015, "total_steps": 33920, "loss": 0.2707, "lr": 3.7985800834976494e-06, "epoch": 12.390919811320755, "percentage": 61.95, "elapsed_time": "0:40:05", "remaining_time": "0:24:37", "throughput": 5701.65, "total_tokens": 13714648} {"current_steps": 21020, "total_steps": 33920, "loss": 0.2912, "lr": 3.7960829022806965e-06, "epoch": 12.393867924528301, "percentage": 61.97, "elapsed_time": "0:40:05", "remaining_time": "0:24:36", "throughput": 5701.68, "total_tokens": 13717880} {"current_steps": 21025, "total_steps": 33920, "loss": 0.3051, "lr": 3.793586039805984e-06, "epoch": 12.39681603773585, "percentage": 61.98, "elapsed_time": "0:40:06", "remaining_time": "0:24:35", "throughput": 5701.62, "total_tokens": 13720600} {"current_steps": 21030, "total_steps": 33920, "loss": 0.3643, "lr": 3.791089496734567e-06, "epoch": 12.399764150943396, "percentage": 62.0, "elapsed_time": "0:40:06", "remaining_time": "0:24:35", "throughput": 5701.69, "total_tokens": 13723800} {"current_steps": 21035, "total_steps": 33920, "loss": 0.3376, "lr": 3.7885932737274163e-06, "epoch": 12.402712264150944, "percentage": 62.01, "elapsed_time": "0:40:07", "remaining_time": "0:24:34", "throughput": 5701.71, "total_tokens": 13727032} {"current_steps": 21040, "total_steps": 33920, "loss": 0.3379, "lr": 3.7860973714454156e-06, "epoch": 12.40566037735849, "percentage": 62.03, "elapsed_time": "0:40:08", "remaining_time": "0:24:34", "throughput": 5701.72, "total_tokens": 13730040} {"current_steps": 21045, "total_steps": 33920, "loss": 0.3424, "lr": 3.7836017905493695e-06, "epoch": 12.408608490566039, "percentage": 62.04, "elapsed_time": "0:40:08", "remaining_time": "0:24:33", "throughput": 5701.76, "total_tokens": 13733560} {"current_steps": 21050, "total_steps": 33920, "loss": 0.3554, "lr": 3.7811065316999908e-06, "epoch": 12.411556603773585, "percentage": 62.06, "elapsed_time": "0:40:09", "remaining_time": "0:24:33", "throughput": 5701.88, "total_tokens": 13737080} {"current_steps": 21055, "total_steps": 33920, "loss": 0.4199, "lr": 3.7786115955579105e-06, "epoch": 12.414504716981131, "percentage": 62.07, "elapsed_time": "0:40:09", "remaining_time": "0:24:32", "throughput": 5702.09, "total_tokens": 13741432} {"current_steps": 21060, "total_steps": 33920, "loss": 0.3953, "lr": 3.7761169827836746e-06, "epoch": 12.41745283018868, "percentage": 62.09, "elapsed_time": "0:40:11", "remaining_time": "0:24:32", "throughput": 5702.57, "total_tokens": 13749272} {"current_steps": 21065, "total_steps": 33920, "loss": 0.3446, "lr": 3.773622694037743e-06, "epoch": 12.420400943396226, "percentage": 62.1, "elapsed_time": "0:40:11", "remaining_time": "0:24:31", "throughput": 5702.59, "total_tokens": 13752312} {"current_steps": 21070, "total_steps": 33920, "loss": 0.4225, "lr": 3.7711287299804865e-06, "epoch": 12.423349056603774, "percentage": 62.12, "elapsed_time": "0:40:12", "remaining_time": "0:24:31", "throughput": 5702.77, "total_tokens": 13756088} {"current_steps": 21075, "total_steps": 33920, "loss": 0.3629, "lr": 3.768635091272197e-06, "epoch": 12.42629716981132, "percentage": 62.13, "elapsed_time": "0:40:12", "remaining_time": "0:24:30", "throughput": 5702.75, "total_tokens": 13759192} {"current_steps": 21080, "total_steps": 33920, "loss": 0.3697, "lr": 3.7661417785730732e-06, "epoch": 12.429245283018869, "percentage": 62.15, "elapsed_time": "0:40:13", "remaining_time": "0:24:29", "throughput": 5702.81, "total_tokens": 13762392} {"current_steps": 21085, "total_steps": 33920, "loss": 0.4001, "lr": 3.7636487925432304e-06, "epoch": 12.432193396226415, "percentage": 62.16, "elapsed_time": "0:40:13", "remaining_time": "0:24:29", "throughput": 5702.76, "total_tokens": 13765560} {"current_steps": 21090, "total_steps": 33920, "loss": 0.3054, "lr": 3.761156133842697e-06, "epoch": 12.435141509433961, "percentage": 62.18, "elapsed_time": "0:40:14", "remaining_time": "0:24:28", "throughput": 5702.75, "total_tokens": 13768792} {"current_steps": 21095, "total_steps": 33920, "loss": 0.2721, "lr": 3.7586638031314182e-06, "epoch": 12.43808962264151, "percentage": 62.19, "elapsed_time": "0:40:14", "remaining_time": "0:24:28", "throughput": 5702.61, "total_tokens": 13771544} {"current_steps": 21100, "total_steps": 33920, "loss": 0.2734, "lr": 3.7561718010692477e-06, "epoch": 12.441037735849056, "percentage": 62.21, "elapsed_time": "0:40:15", "remaining_time": "0:24:27", "throughput": 5702.51, "total_tokens": 13774264} {"current_steps": 21105, "total_steps": 33920, "loss": 0.45, "lr": 3.7536801283159523e-06, "epoch": 12.443985849056604, "percentage": 62.22, "elapsed_time": "0:40:15", "remaining_time": "0:24:26", "throughput": 5702.48, "total_tokens": 13777176} {"current_steps": 21110, "total_steps": 33920, "loss": 0.3517, "lr": 3.7511887855312155e-06, "epoch": 12.44693396226415, "percentage": 62.23, "elapsed_time": "0:40:16", "remaining_time": "0:24:26", "throughput": 5702.32, "total_tokens": 13779640} {"current_steps": 21115, "total_steps": 33920, "loss": 0.2688, "lr": 3.74869777337463e-06, "epoch": 12.449882075471699, "percentage": 62.25, "elapsed_time": "0:40:17", "remaining_time": "0:24:25", "throughput": 5702.36, "total_tokens": 13782872} {"current_steps": 21120, "total_steps": 33920, "loss": 0.3517, "lr": 3.7462070925057004e-06, "epoch": 12.452830188679245, "percentage": 62.26, "elapsed_time": "0:40:17", "remaining_time": "0:24:25", "throughput": 5702.7, "total_tokens": 13787512} {"current_steps": 21125, "total_steps": 33920, "loss": 0.2963, "lr": 3.7437167435838472e-06, "epoch": 12.455778301886792, "percentage": 62.28, "elapsed_time": "0:40:18", "remaining_time": "0:24:24", "throughput": 5702.76, "total_tokens": 13790584} {"current_steps": 21130, "total_steps": 33920, "loss": 0.4306, "lr": 3.741226727268401e-06, "epoch": 12.45872641509434, "percentage": 62.29, "elapsed_time": "0:40:18", "remaining_time": "0:24:24", "throughput": 5702.9, "total_tokens": 13793976} {"current_steps": 21135, "total_steps": 33920, "loss": 0.3287, "lr": 3.7387370442186027e-06, "epoch": 12.461674528301886, "percentage": 62.31, "elapsed_time": "0:40:19", "remaining_time": "0:24:23", "throughput": 5702.96, "total_tokens": 13797528} {"current_steps": 21140, "total_steps": 33920, "loss": 0.3129, "lr": 3.736247695093609e-06, "epoch": 12.464622641509434, "percentage": 62.32, "elapsed_time": "0:40:19", "remaining_time": "0:24:22", "throughput": 5703.01, "total_tokens": 13800696} {"current_steps": 21145, "total_steps": 33920, "loss": 0.3624, "lr": 3.7337586805524838e-06, "epoch": 12.46757075471698, "percentage": 62.34, "elapsed_time": "0:40:20", "remaining_time": "0:24:22", "throughput": 5703.17, "total_tokens": 13804312} {"current_steps": 21150, "total_steps": 33920, "loss": 0.3027, "lr": 3.731270001254205e-06, "epoch": 12.470518867924529, "percentage": 62.35, "elapsed_time": "0:40:20", "remaining_time": "0:24:21", "throughput": 5703.11, "total_tokens": 13807096} {"current_steps": 21155, "total_steps": 33920, "loss": 0.3137, "lr": 3.728781657857661e-06, "epoch": 12.473466981132075, "percentage": 62.37, "elapsed_time": "0:40:21", "remaining_time": "0:24:21", "throughput": 5703.2, "total_tokens": 13810744} {"current_steps": 21160, "total_steps": 33920, "loss": 0.3676, "lr": 3.726293651021653e-06, "epoch": 12.476415094339623, "percentage": 62.38, "elapsed_time": "0:40:22", "remaining_time": "0:24:20", "throughput": 5703.27, "total_tokens": 13814296} {"current_steps": 21165, "total_steps": 33920, "loss": 0.2998, "lr": 3.7238059814048888e-06, "epoch": 12.47936320754717, "percentage": 62.4, "elapsed_time": "0:40:22", "remaining_time": "0:24:20", "throughput": 5703.21, "total_tokens": 13817112} {"current_steps": 21170, "total_steps": 33920, "loss": 0.4281, "lr": 3.7213186496659916e-06, "epoch": 12.482311320754716, "percentage": 62.41, "elapsed_time": "0:40:23", "remaining_time": "0:24:19", "throughput": 5703.1, "total_tokens": 13819832} {"current_steps": 21175, "total_steps": 33920, "loss": 0.4268, "lr": 3.718831656463493e-06, "epoch": 12.485259433962264, "percentage": 62.43, "elapsed_time": "0:40:23", "remaining_time": "0:24:18", "throughput": 5702.94, "total_tokens": 13822712} {"current_steps": 21180, "total_steps": 33920, "loss": 0.3813, "lr": 3.7163450024558345e-06, "epoch": 12.48820754716981, "percentage": 62.44, "elapsed_time": "0:40:24", "remaining_time": "0:24:18", "throughput": 5702.89, "total_tokens": 13825624} {"current_steps": 21185, "total_steps": 33920, "loss": 0.2945, "lr": 3.7138586883013694e-06, "epoch": 12.491155660377359, "percentage": 62.46, "elapsed_time": "0:40:24", "remaining_time": "0:24:17", "throughput": 5702.82, "total_tokens": 13828440} {"current_steps": 21190, "total_steps": 33920, "loss": 0.325, "lr": 3.7113727146583573e-06, "epoch": 12.494103773584905, "percentage": 62.47, "elapsed_time": "0:40:25", "remaining_time": "0:24:17", "throughput": 5702.79, "total_tokens": 13831544} {"current_steps": 21195, "total_steps": 33920, "loss": 0.4517, "lr": 3.7088870821849748e-06, "epoch": 12.497051886792454, "percentage": 62.49, "elapsed_time": "0:40:25", "remaining_time": "0:24:16", "throughput": 5702.79, "total_tokens": 13834520} {"current_steps": 21200, "total_steps": 33920, "loss": 0.4052, "lr": 3.706401791539301e-06, "epoch": 12.5, "percentage": 62.5, "elapsed_time": "0:40:26", "remaining_time": "0:24:15", "throughput": 5702.9, "total_tokens": 13838040} {"current_steps": 21205, "total_steps": 33920, "loss": 0.3706, "lr": 3.703916843379328e-06, "epoch": 12.502948113207546, "percentage": 62.51, "elapsed_time": "0:40:27", "remaining_time": "0:24:15", "throughput": 5703.02, "total_tokens": 13841688} {"current_steps": 21210, "total_steps": 33920, "loss": 0.265, "lr": 3.7014322383629575e-06, "epoch": 12.505896226415095, "percentage": 62.53, "elapsed_time": "0:40:27", "remaining_time": "0:24:14", "throughput": 5703.14, "total_tokens": 13845144} {"current_steps": 21215, "total_steps": 33920, "loss": 0.4326, "lr": 3.6989479771479976e-06, "epoch": 12.508844339622641, "percentage": 62.54, "elapsed_time": "0:40:28", "remaining_time": "0:24:14", "throughput": 5703.1, "total_tokens": 13847928} {"current_steps": 21220, "total_steps": 33920, "loss": 0.3763, "lr": 3.696464060392169e-06, "epoch": 12.51179245283019, "percentage": 62.56, "elapsed_time": "0:40:28", "remaining_time": "0:24:13", "throughput": 5703.18, "total_tokens": 13851320} {"current_steps": 21225, "total_steps": 33920, "loss": 0.2907, "lr": 3.6939804887530962e-06, "epoch": 12.514740566037736, "percentage": 62.57, "elapsed_time": "0:40:29", "remaining_time": "0:24:12", "throughput": 5703.27, "total_tokens": 13854520} {"current_steps": 21230, "total_steps": 33920, "loss": 0.4019, "lr": 3.6914972628883196e-06, "epoch": 12.517688679245284, "percentage": 62.59, "elapsed_time": "0:40:29", "remaining_time": "0:24:12", "throughput": 5703.36, "total_tokens": 13858648} {"current_steps": 21235, "total_steps": 33920, "loss": 0.347, "lr": 3.6890143834552814e-06, "epoch": 12.52063679245283, "percentage": 62.6, "elapsed_time": "0:40:30", "remaining_time": "0:24:11", "throughput": 5703.39, "total_tokens": 13861880} {"current_steps": 21240, "total_steps": 33920, "loss": 0.3717, "lr": 3.6865318511113347e-06, "epoch": 12.523584905660378, "percentage": 62.62, "elapsed_time": "0:40:30", "remaining_time": "0:24:11", "throughput": 5703.2, "total_tokens": 13864376} {"current_steps": 21245, "total_steps": 33920, "loss": 0.2905, "lr": 3.684049666513742e-06, "epoch": 12.526533018867925, "percentage": 62.63, "elapsed_time": "0:40:31", "remaining_time": "0:24:10", "throughput": 5703.18, "total_tokens": 13867288} {"current_steps": 21250, "total_steps": 33920, "loss": 0.3394, "lr": 3.6815678303196715e-06, "epoch": 12.529481132075471, "percentage": 62.65, "elapsed_time": "0:40:32", "remaining_time": "0:24:10", "throughput": 5703.17, "total_tokens": 13870264} {"current_steps": 21255, "total_steps": 33920, "loss": 0.278, "lr": 3.6790863431861988e-06, "epoch": 12.53242924528302, "percentage": 62.66, "elapsed_time": "0:40:32", "remaining_time": "0:24:09", "throughput": 5703.33, "total_tokens": 13874360} {"current_steps": 21260, "total_steps": 33920, "loss": 0.4347, "lr": 3.676605205770311e-06, "epoch": 12.535377358490566, "percentage": 62.68, "elapsed_time": "0:40:33", "remaining_time": "0:24:08", "throughput": 5703.1, "total_tokens": 13876664} {"current_steps": 21265, "total_steps": 33920, "loss": 0.3338, "lr": 3.674124418728898e-06, "epoch": 12.538325471698114, "percentage": 62.69, "elapsed_time": "0:40:33", "remaining_time": "0:24:08", "throughput": 5703.16, "total_tokens": 13880088} {"current_steps": 21270, "total_steps": 33920, "loss": 0.3735, "lr": 3.671643982718759e-06, "epoch": 12.54127358490566, "percentage": 62.71, "elapsed_time": "0:40:34", "remaining_time": "0:24:07", "throughput": 5703.18, "total_tokens": 13883160} {"current_steps": 21275, "total_steps": 33920, "loss": 0.3897, "lr": 3.6691638983966017e-06, "epoch": 12.544221698113208, "percentage": 62.72, "elapsed_time": "0:40:34", "remaining_time": "0:24:07", "throughput": 5703.3, "total_tokens": 13886648} {"current_steps": 21280, "total_steps": 33920, "loss": 0.4713, "lr": 3.666684166419037e-06, "epoch": 12.547169811320755, "percentage": 62.74, "elapsed_time": "0:40:35", "remaining_time": "0:24:06", "throughput": 5703.27, "total_tokens": 13889656} {"current_steps": 21285, "total_steps": 33920, "loss": 0.2621, "lr": 3.6642047874425833e-06, "epoch": 12.550117924528301, "percentage": 62.75, "elapsed_time": "0:40:35", "remaining_time": "0:24:06", "throughput": 5703.34, "total_tokens": 13893144} {"current_steps": 21290, "total_steps": 33920, "loss": 0.3365, "lr": 3.661725762123671e-06, "epoch": 12.55306603773585, "percentage": 62.77, "elapsed_time": "0:40:36", "remaining_time": "0:24:05", "throughput": 5703.34, "total_tokens": 13896056} {"current_steps": 21295, "total_steps": 33920, "loss": 0.3294, "lr": 3.659247091118631e-06, "epoch": 12.556014150943396, "percentage": 62.78, "elapsed_time": "0:40:37", "remaining_time": "0:24:04", "throughput": 5703.04, "total_tokens": 13898360} {"current_steps": 21300, "total_steps": 33920, "loss": 0.2824, "lr": 3.6567687750837027e-06, "epoch": 12.558962264150944, "percentage": 62.79, "elapsed_time": "0:40:37", "remaining_time": "0:24:04", "throughput": 5703.05, "total_tokens": 13901464} {"current_steps": 21305, "total_steps": 33920, "loss": 0.3537, "lr": 3.6542908146750287e-06, "epoch": 12.56191037735849, "percentage": 62.81, "elapsed_time": "0:40:38", "remaining_time": "0:24:03", "throughput": 5703.12, "total_tokens": 13904504} {"current_steps": 21310, "total_steps": 33920, "loss": 0.2647, "lr": 3.6518132105486624e-06, "epoch": 12.564858490566039, "percentage": 62.82, "elapsed_time": "0:40:38", "remaining_time": "0:24:03", "throughput": 5703.09, "total_tokens": 13907896} {"current_steps": 21315, "total_steps": 33920, "loss": 0.4073, "lr": 3.649335963360559e-06, "epoch": 12.567806603773585, "percentage": 62.84, "elapsed_time": "0:40:39", "remaining_time": "0:24:02", "throughput": 5703.11, "total_tokens": 13911320} {"current_steps": 21320, "total_steps": 33920, "loss": 0.3035, "lr": 3.6468590737665795e-06, "epoch": 12.570754716981131, "percentage": 62.85, "elapsed_time": "0:40:39", "remaining_time": "0:24:01", "throughput": 5703.24, "total_tokens": 13915000} {"current_steps": 21325, "total_steps": 33920, "loss": 0.4027, "lr": 3.6443825424224926e-06, "epoch": 12.57370283018868, "percentage": 62.87, "elapsed_time": "0:40:40", "remaining_time": "0:24:01", "throughput": 5703.09, "total_tokens": 13917560} {"current_steps": 21330, "total_steps": 33920, "loss": 0.2905, "lr": 3.64190636998397e-06, "epoch": 12.576650943396226, "percentage": 62.88, "elapsed_time": "0:40:40", "remaining_time": "0:24:00", "throughput": 5702.94, "total_tokens": 13920120} {"current_steps": 21335, "total_steps": 33920, "loss": 0.3219, "lr": 3.639430557106588e-06, "epoch": 12.579599056603774, "percentage": 62.9, "elapsed_time": "0:40:41", "remaining_time": "0:24:00", "throughput": 5702.9, "total_tokens": 13923032} {"current_steps": 21340, "total_steps": 33920, "loss": 0.3395, "lr": 3.6369551044458314e-06, "epoch": 12.58254716981132, "percentage": 62.91, "elapsed_time": "0:40:41", "remaining_time": "0:23:59", "throughput": 5703.06, "total_tokens": 13926840} {"current_steps": 21345, "total_steps": 33920, "loss": 0.4165, "lr": 3.6344800126570846e-06, "epoch": 12.585495283018869, "percentage": 62.93, "elapsed_time": "0:40:42", "remaining_time": "0:23:58", "throughput": 5702.91, "total_tokens": 13929400} {"current_steps": 21350, "total_steps": 33920, "loss": 0.2435, "lr": 3.6320052823956385e-06, "epoch": 12.588443396226415, "percentage": 62.94, "elapsed_time": "0:40:43", "remaining_time": "0:23:58", "throughput": 5702.86, "total_tokens": 13932120} {"current_steps": 21355, "total_steps": 33920, "loss": 0.234, "lr": 3.6295309143166906e-06, "epoch": 12.591391509433961, "percentage": 62.96, "elapsed_time": "0:40:43", "remaining_time": "0:23:57", "throughput": 5702.8, "total_tokens": 13935064} {"current_steps": 21360, "total_steps": 33920, "loss": 0.3314, "lr": 3.62705690907534e-06, "epoch": 12.59433962264151, "percentage": 62.97, "elapsed_time": "0:40:44", "remaining_time": "0:23:57", "throughput": 5702.87, "total_tokens": 13938584} {"current_steps": 21365, "total_steps": 33920, "loss": 0.3161, "lr": 3.624583267326588e-06, "epoch": 12.597287735849056, "percentage": 62.99, "elapsed_time": "0:40:44", "remaining_time": "0:23:56", "throughput": 5702.88, "total_tokens": 13941656} {"current_steps": 21370, "total_steps": 33920, "loss": 0.3433, "lr": 3.6221099897253454e-06, "epoch": 12.600235849056604, "percentage": 63.0, "elapsed_time": "0:40:45", "remaining_time": "0:23:55", "throughput": 5702.84, "total_tokens": 13944472} {"current_steps": 21375, "total_steps": 33920, "loss": 0.3209, "lr": 3.619637076926421e-06, "epoch": 12.60318396226415, "percentage": 63.02, "elapsed_time": "0:40:45", "remaining_time": "0:23:55", "throughput": 5702.81, "total_tokens": 13947512} {"current_steps": 21380, "total_steps": 33920, "loss": 0.3816, "lr": 3.617164529584528e-06, "epoch": 12.606132075471699, "percentage": 63.03, "elapsed_time": "0:40:46", "remaining_time": "0:23:54", "throughput": 5702.84, "total_tokens": 13950808} {"current_steps": 21385, "total_steps": 33920, "loss": 0.2666, "lr": 3.614692348354286e-06, "epoch": 12.609080188679245, "percentage": 63.05, "elapsed_time": "0:40:46", "remaining_time": "0:23:54", "throughput": 5702.89, "total_tokens": 13954072} {"current_steps": 21390, "total_steps": 33920, "loss": 0.3719, "lr": 3.612220533890216e-06, "epoch": 12.612028301886792, "percentage": 63.06, "elapsed_time": "0:40:47", "remaining_time": "0:23:53", "throughput": 5702.88, "total_tokens": 13957016} {"current_steps": 21395, "total_steps": 33920, "loss": 0.2846, "lr": 3.609749086846741e-06, "epoch": 12.61497641509434, "percentage": 63.07, "elapsed_time": "0:40:47", "remaining_time": "0:23:53", "throughput": 5702.84, "total_tokens": 13960024} {"current_steps": 21400, "total_steps": 33920, "loss": 0.3851, "lr": 3.607278007878186e-06, "epoch": 12.617924528301886, "percentage": 63.09, "elapsed_time": "0:40:48", "remaining_time": "0:23:52", "throughput": 5702.93, "total_tokens": 13963320} {"current_steps": 21405, "total_steps": 33920, "loss": 0.3583, "lr": 3.6048072976387817e-06, "epoch": 12.620872641509434, "percentage": 63.1, "elapsed_time": "0:40:48", "remaining_time": "0:23:51", "throughput": 5702.99, "total_tokens": 13966424} {"current_steps": 21410, "total_steps": 33920, "loss": 0.3542, "lr": 3.6023369567826585e-06, "epoch": 12.62382075471698, "percentage": 63.12, "elapsed_time": "0:40:49", "remaining_time": "0:23:51", "throughput": 5703.03, "total_tokens": 13969688} {"current_steps": 21415, "total_steps": 33920, "loss": 0.3137, "lr": 3.599866985963848e-06, "epoch": 12.626768867924529, "percentage": 63.13, "elapsed_time": "0:40:50", "remaining_time": "0:23:50", "throughput": 5703.33, "total_tokens": 13975928} {"current_steps": 21420, "total_steps": 33920, "loss": 0.3308, "lr": 3.5973973858362885e-06, "epoch": 12.629716981132075, "percentage": 63.15, "elapsed_time": "0:40:50", "remaining_time": "0:23:50", "throughput": 5703.45, "total_tokens": 13979128} {"current_steps": 21425, "total_steps": 33920, "loss": 0.3491, "lr": 3.594928157053816e-06, "epoch": 12.632665094339622, "percentage": 63.16, "elapsed_time": "0:40:51", "remaining_time": "0:23:49", "throughput": 5703.62, "total_tokens": 13982488} {"current_steps": 21430, "total_steps": 33920, "loss": 0.283, "lr": 3.592459300270168e-06, "epoch": 12.63561320754717, "percentage": 63.18, "elapsed_time": "0:40:52", "remaining_time": "0:23:49", "throughput": 5703.81, "total_tokens": 13986232} {"current_steps": 21435, "total_steps": 33920, "loss": 0.3874, "lr": 3.589990816138988e-06, "epoch": 12.638561320754716, "percentage": 63.19, "elapsed_time": "0:40:52", "remaining_time": "0:23:48", "throughput": 5703.73, "total_tokens": 13989016} {"current_steps": 21440, "total_steps": 33920, "loss": 0.3531, "lr": 3.587522705313816e-06, "epoch": 12.641509433962264, "percentage": 63.21, "elapsed_time": "0:40:53", "remaining_time": "0:23:48", "throughput": 5704.4, "total_tokens": 13998008} {"current_steps": 21445, "total_steps": 33920, "loss": 0.3027, "lr": 3.585054968448094e-06, "epoch": 12.64445754716981, "percentage": 63.22, "elapsed_time": "0:40:54", "remaining_time": "0:23:47", "throughput": 5704.45, "total_tokens": 14001240} {"current_steps": 21450, "total_steps": 33920, "loss": 0.4439, "lr": 3.5825876061951686e-06, "epoch": 12.647405660377359, "percentage": 63.24, "elapsed_time": "0:40:54", "remaining_time": "0:23:47", "throughput": 5704.35, "total_tokens": 14004024} {"current_steps": 21455, "total_steps": 33920, "loss": 0.2395, "lr": 3.5801206192082818e-06, "epoch": 12.650353773584905, "percentage": 63.25, "elapsed_time": "0:40:55", "remaining_time": "0:23:46", "throughput": 5704.22, "total_tokens": 14006712} {"current_steps": 21460, "total_steps": 33920, "loss": 0.3093, "lr": 3.577654008140582e-06, "epoch": 12.653301886792454, "percentage": 63.27, "elapsed_time": "0:40:56", "remaining_time": "0:23:46", "throughput": 5704.27, "total_tokens": 14010648} {"current_steps": 21465, "total_steps": 33920, "loss": 0.2982, "lr": 3.5751877736451123e-06, "epoch": 12.65625, "percentage": 63.28, "elapsed_time": "0:40:56", "remaining_time": "0:23:45", "throughput": 5703.96, "total_tokens": 14013080} {"current_steps": 21470, "total_steps": 33920, "loss": 0.3245, "lr": 3.5727219163748205e-06, "epoch": 12.659198113207546, "percentage": 63.3, "elapsed_time": "0:40:57", "remaining_time": "0:23:44", "throughput": 5703.85, "total_tokens": 14016088} {"current_steps": 21475, "total_steps": 33920, "loss": 0.3602, "lr": 3.570256436982552e-06, "epoch": 12.662146226415095, "percentage": 63.31, "elapsed_time": "0:40:57", "remaining_time": "0:23:44", "throughput": 5703.61, "total_tokens": 14018392} {"current_steps": 21480, "total_steps": 33920, "loss": 0.3106, "lr": 3.5677913361210536e-06, "epoch": 12.665094339622641, "percentage": 63.33, "elapsed_time": "0:40:58", "remaining_time": "0:23:43", "throughput": 5703.56, "total_tokens": 14021560} {"current_steps": 21485, "total_steps": 33920, "loss": 0.3472, "lr": 3.565326614442972e-06, "epoch": 12.66804245283019, "percentage": 63.34, "elapsed_time": "0:40:58", "remaining_time": "0:23:43", "throughput": 5703.75, "total_tokens": 14025176} {"current_steps": 21490, "total_steps": 33920, "loss": 0.3692, "lr": 3.5628622726008523e-06, "epoch": 12.670990566037736, "percentage": 63.35, "elapsed_time": "0:40:59", "remaining_time": "0:23:42", "throughput": 5703.77, "total_tokens": 14028408} {"current_steps": 21495, "total_steps": 33920, "loss": 0.4373, "lr": 3.56039831124714e-06, "epoch": 12.673938679245284, "percentage": 63.37, "elapsed_time": "0:41:00", "remaining_time": "0:23:42", "throughput": 5703.86, "total_tokens": 14032024} {"current_steps": 21500, "total_steps": 33920, "loss": 0.27, "lr": 3.557934731034179e-06, "epoch": 12.67688679245283, "percentage": 63.38, "elapsed_time": "0:41:00", "remaining_time": "0:23:41", "throughput": 5703.69, "total_tokens": 14034456} {"current_steps": 21505, "total_steps": 33920, "loss": 0.352, "lr": 3.5554715326142126e-06, "epoch": 12.679834905660378, "percentage": 63.4, "elapsed_time": "0:41:01", "remaining_time": "0:23:40", "throughput": 5703.87, "total_tokens": 14038584} {"current_steps": 21510, "total_steps": 33920, "loss": 0.2779, "lr": 3.553008716639384e-06, "epoch": 12.682783018867925, "percentage": 63.41, "elapsed_time": "0:41:01", "remaining_time": "0:23:40", "throughput": 5703.77, "total_tokens": 14041272} {"current_steps": 21515, "total_steps": 33920, "loss": 0.3029, "lr": 3.5505462837617338e-06, "epoch": 12.685731132075471, "percentage": 63.43, "elapsed_time": "0:41:02", "remaining_time": "0:23:39", "throughput": 5704.03, "total_tokens": 14045272} {"current_steps": 21520, "total_steps": 33920, "loss": 0.3017, "lr": 3.5480842346332013e-06, "epoch": 12.68867924528302, "percentage": 63.44, "elapsed_time": "0:41:02", "remaining_time": "0:23:39", "throughput": 5704.05, "total_tokens": 14048280} {"current_steps": 21525, "total_steps": 33920, "loss": 0.3993, "lr": 3.5456225699056256e-06, "epoch": 12.691627358490566, "percentage": 63.46, "elapsed_time": "0:41:03", "remaining_time": "0:23:38", "throughput": 5704.29, "total_tokens": 14052184} {"current_steps": 21530, "total_steps": 33920, "loss": 0.3501, "lr": 3.5431612902307426e-06, "epoch": 12.694575471698114, "percentage": 63.47, "elapsed_time": "0:41:04", "remaining_time": "0:23:37", "throughput": 5704.41, "total_tokens": 14055768} {"current_steps": 21535, "total_steps": 33920, "loss": 0.3326, "lr": 3.540700396260186e-06, "epoch": 12.69752358490566, "percentage": 63.49, "elapsed_time": "0:41:04", "remaining_time": "0:23:37", "throughput": 5704.07, "total_tokens": 14058072} {"current_steps": 21540, "total_steps": 33920, "loss": 0.4521, "lr": 3.538239888645489e-06, "epoch": 12.700471698113208, "percentage": 63.5, "elapsed_time": "0:41:05", "remaining_time": "0:23:37", "throughput": 5704.52, "total_tokens": 14064184} {"current_steps": 21545, "total_steps": 33920, "loss": 0.3504, "lr": 3.535779768038082e-06, "epoch": 12.703419811320755, "percentage": 63.52, "elapsed_time": "0:41:06", "remaining_time": "0:23:36", "throughput": 5704.62, "total_tokens": 14067736} {"current_steps": 21550, "total_steps": 33920, "loss": 0.2695, "lr": 3.5333200350892905e-06, "epoch": 12.706367924528301, "percentage": 63.53, "elapsed_time": "0:41:06", "remaining_time": "0:23:35", "throughput": 5704.69, "total_tokens": 14071000} {"current_steps": 21555, "total_steps": 33920, "loss": 0.4768, "lr": 3.530860690450342e-06, "epoch": 12.70931603773585, "percentage": 63.55, "elapsed_time": "0:41:07", "remaining_time": "0:23:35", "throughput": 5704.66, "total_tokens": 14073880} {"current_steps": 21560, "total_steps": 33920, "loss": 0.3675, "lr": 3.528401734772357e-06, "epoch": 12.712264150943396, "percentage": 63.56, "elapsed_time": "0:41:07", "remaining_time": "0:23:34", "throughput": 5704.53, "total_tokens": 14076440} {"current_steps": 21565, "total_steps": 33920, "loss": 0.3076, "lr": 3.5259431687063538e-06, "epoch": 12.715212264150944, "percentage": 63.58, "elapsed_time": "0:41:08", "remaining_time": "0:23:34", "throughput": 5704.53, "total_tokens": 14080056} {"current_steps": 21570, "total_steps": 33920, "loss": 0.3149, "lr": 3.523484992903249e-06, "epoch": 12.71816037735849, "percentage": 63.59, "elapsed_time": "0:41:08", "remaining_time": "0:23:33", "throughput": 5704.39, "total_tokens": 14082648} {"current_steps": 21575, "total_steps": 33920, "loss": 0.3692, "lr": 3.5210272080138573e-06, "epoch": 12.721108490566039, "percentage": 63.61, "elapsed_time": "0:41:09", "remaining_time": "0:23:32", "throughput": 5704.03, "total_tokens": 14084824} {"current_steps": 21580, "total_steps": 33920, "loss": 0.3751, "lr": 3.518569814688887e-06, "epoch": 12.724056603773585, "percentage": 63.62, "elapsed_time": "0:41:09", "remaining_time": "0:23:32", "throughput": 5704.03, "total_tokens": 14087736} {"current_steps": 21585, "total_steps": 33920, "loss": 0.3009, "lr": 3.5161128135789414e-06, "epoch": 12.727004716981131, "percentage": 63.64, "elapsed_time": "0:41:10", "remaining_time": "0:23:31", "throughput": 5704.08, "total_tokens": 14090840} {"current_steps": 21590, "total_steps": 33920, "loss": 0.285, "lr": 3.513656205334525e-06, "epoch": 12.72995283018868, "percentage": 63.65, "elapsed_time": "0:41:10", "remaining_time": "0:23:31", "throughput": 5704.12, "total_tokens": 14094008} {"current_steps": 21595, "total_steps": 33920, "loss": 0.3837, "lr": 3.5111999906060336e-06, "epoch": 12.732900943396226, "percentage": 63.66, "elapsed_time": "0:41:11", "remaining_time": "0:23:30", "throughput": 5704.13, "total_tokens": 14097176} {"current_steps": 21600, "total_steps": 33920, "loss": 0.2791, "lr": 3.50874417004376e-06, "epoch": 12.735849056603774, "percentage": 63.68, "elapsed_time": "0:41:11", "remaining_time": "0:23:29", "throughput": 5704.23, "total_tokens": 14100536} {"current_steps": 21605, "total_steps": 33920, "loss": 0.344, "lr": 3.5062887442978956e-06, "epoch": 12.73879716981132, "percentage": 63.69, "elapsed_time": "0:41:12", "remaining_time": "0:23:29", "throughput": 5704.24, "total_tokens": 14103576} {"current_steps": 21610, "total_steps": 33920, "loss": 0.3228, "lr": 3.503833714018524e-06, "epoch": 12.741745283018869, "percentage": 63.71, "elapsed_time": "0:41:13", "remaining_time": "0:23:28", "throughput": 5704.28, "total_tokens": 14106872} {"current_steps": 21615, "total_steps": 33920, "loss": 0.3708, "lr": 3.5013790798556228e-06, "epoch": 12.744693396226415, "percentage": 63.72, "elapsed_time": "0:41:13", "remaining_time": "0:23:28", "throughput": 5704.44, "total_tokens": 14110712} {"current_steps": 21620, "total_steps": 33920, "loss": 0.3733, "lr": 3.4989248424590705e-06, "epoch": 12.747641509433961, "percentage": 63.74, "elapsed_time": "0:41:14", "remaining_time": "0:23:27", "throughput": 5704.45, "total_tokens": 14114008} {"current_steps": 21625, "total_steps": 33920, "loss": 0.3742, "lr": 3.4964710024786354e-06, "epoch": 12.75058962264151, "percentage": 63.75, "elapsed_time": "0:41:14", "remaining_time": "0:23:27", "throughput": 5704.48, "total_tokens": 14117112} {"current_steps": 21630, "total_steps": 33920, "loss": 0.3433, "lr": 3.4940175605639813e-06, "epoch": 12.753537735849056, "percentage": 63.77, "elapsed_time": "0:41:15", "remaining_time": "0:23:26", "throughput": 5704.44, "total_tokens": 14119896} {"current_steps": 21635, "total_steps": 33920, "loss": 0.5534, "lr": 3.4915645173646694e-06, "epoch": 12.756485849056604, "percentage": 63.78, "elapsed_time": "0:41:15", "remaining_time": "0:23:25", "throughput": 5704.31, "total_tokens": 14122840} {"current_steps": 21640, "total_steps": 33920, "loss": 0.4638, "lr": 3.489111873530153e-06, "epoch": 12.75943396226415, "percentage": 63.8, "elapsed_time": "0:41:16", "remaining_time": "0:23:25", "throughput": 5704.13, "total_tokens": 14125304} {"current_steps": 21645, "total_steps": 33920, "loss": 0.4115, "lr": 3.4866596297097776e-06, "epoch": 12.762382075471699, "percentage": 63.81, "elapsed_time": "0:41:16", "remaining_time": "0:23:24", "throughput": 5704.27, "total_tokens": 14128856} {"current_steps": 21650, "total_steps": 33920, "loss": 0.3267, "lr": 3.484207786552789e-06, "epoch": 12.765330188679245, "percentage": 63.83, "elapsed_time": "0:41:17", "remaining_time": "0:23:24", "throughput": 5704.22, "total_tokens": 14132024} {"current_steps": 21655, "total_steps": 33920, "loss": 0.3325, "lr": 3.4817563447083214e-06, "epoch": 12.768278301886792, "percentage": 63.84, "elapsed_time": "0:41:18", "remaining_time": "0:23:23", "throughput": 5704.25, "total_tokens": 14135192} {"current_steps": 21660, "total_steps": 33920, "loss": 0.3522, "lr": 3.4793053048254044e-06, "epoch": 12.77122641509434, "percentage": 63.86, "elapsed_time": "0:41:18", "remaining_time": "0:23:22", "throughput": 5704.3, "total_tokens": 14138776} {"current_steps": 21665, "total_steps": 33920, "loss": 0.3625, "lr": 3.47685466755296e-06, "epoch": 12.774174528301886, "percentage": 63.87, "elapsed_time": "0:41:19", "remaining_time": "0:23:22", "throughput": 5704.32, "total_tokens": 14142136} {"current_steps": 21670, "total_steps": 33920, "loss": 0.3591, "lr": 3.474404433539809e-06, "epoch": 12.777122641509434, "percentage": 63.89, "elapsed_time": "0:41:19", "remaining_time": "0:23:21", "throughput": 5704.36, "total_tokens": 14145400} {"current_steps": 21675, "total_steps": 33920, "loss": 0.3448, "lr": 3.4719546034346598e-06, "epoch": 12.78007075471698, "percentage": 63.9, "elapsed_time": "0:41:20", "remaining_time": "0:23:21", "throughput": 5704.42, "total_tokens": 14149016} {"current_steps": 21680, "total_steps": 33920, "loss": 0.3569, "lr": 3.4695051778861125e-06, "epoch": 12.783018867924529, "percentage": 63.92, "elapsed_time": "0:41:20", "remaining_time": "0:23:20", "throughput": 5704.46, "total_tokens": 14152088} {"current_steps": 21685, "total_steps": 33920, "loss": 0.3916, "lr": 3.4670561575426677e-06, "epoch": 12.785966981132075, "percentage": 63.93, "elapsed_time": "0:41:21", "remaining_time": "0:23:20", "throughput": 5704.29, "total_tokens": 14154840} {"current_steps": 21690, "total_steps": 33920, "loss": 0.3309, "lr": 3.4646075430527115e-06, "epoch": 12.788915094339622, "percentage": 63.94, "elapsed_time": "0:41:22", "remaining_time": "0:23:19", "throughput": 5704.29, "total_tokens": 14158392} {"current_steps": 21695, "total_steps": 33920, "loss": 0.3953, "lr": 3.4621593350645236e-06, "epoch": 12.79186320754717, "percentage": 63.96, "elapsed_time": "0:41:22", "remaining_time": "0:23:18", "throughput": 5704.24, "total_tokens": 14161560} {"current_steps": 21700, "total_steps": 33920, "loss": 0.5333, "lr": 3.4597115342262817e-06, "epoch": 12.794811320754716, "percentage": 63.97, "elapsed_time": "0:41:23", "remaining_time": "0:23:18", "throughput": 5704.3, "total_tokens": 14165272} {"current_steps": 21705, "total_steps": 33920, "loss": 0.2882, "lr": 3.4572641411860484e-06, "epoch": 12.797759433962264, "percentage": 63.99, "elapsed_time": "0:41:23", "remaining_time": "0:23:17", "throughput": 5704.22, "total_tokens": 14168312} {"current_steps": 21710, "total_steps": 33920, "loss": 0.335, "lr": 3.454817156591782e-06, "epoch": 12.80070754716981, "percentage": 64.0, "elapsed_time": "0:41:24", "remaining_time": "0:23:17", "throughput": 5704.15, "total_tokens": 14171544} {"current_steps": 21715, "total_steps": 33920, "loss": 0.3581, "lr": 3.4523705810913344e-06, "epoch": 12.803655660377359, "percentage": 64.02, "elapsed_time": "0:41:24", "remaining_time": "0:23:16", "throughput": 5703.97, "total_tokens": 14174008} {"current_steps": 21720, "total_steps": 33920, "loss": 0.298, "lr": 3.449924415332443e-06, "epoch": 12.806603773584905, "percentage": 64.03, "elapsed_time": "0:41:25", "remaining_time": "0:23:16", "throughput": 5704.01, "total_tokens": 14177560} {"current_steps": 21725, "total_steps": 33920, "loss": 0.3413, "lr": 3.447478659962745e-06, "epoch": 12.809551886792454, "percentage": 64.05, "elapsed_time": "0:41:26", "remaining_time": "0:23:15", "throughput": 5704.05, "total_tokens": 14180632} {"current_steps": 21730, "total_steps": 33920, "loss": 0.4951, "lr": 3.4450333156297625e-06, "epoch": 12.8125, "percentage": 64.06, "elapsed_time": "0:41:26", "remaining_time": "0:23:14", "throughput": 5704.04, "total_tokens": 14183960} {"current_steps": 21735, "total_steps": 33920, "loss": 0.3659, "lr": 3.44258838298091e-06, "epoch": 12.815448113207546, "percentage": 64.08, "elapsed_time": "0:41:27", "remaining_time": "0:23:14", "throughput": 5703.9, "total_tokens": 14186616} {"current_steps": 21740, "total_steps": 33920, "loss": 0.3283, "lr": 3.440143862663497e-06, "epoch": 12.818396226415095, "percentage": 64.09, "elapsed_time": "0:41:27", "remaining_time": "0:23:13", "throughput": 5703.94, "total_tokens": 14189688} {"current_steps": 21745, "total_steps": 33920, "loss": 0.2844, "lr": 3.4376997553247183e-06, "epoch": 12.821344339622641, "percentage": 64.11, "elapsed_time": "0:41:28", "remaining_time": "0:23:13", "throughput": 5703.98, "total_tokens": 14192984} {"current_steps": 21750, "total_steps": 33920, "loss": 0.3077, "lr": 3.4352560616116617e-06, "epoch": 12.82429245283019, "percentage": 64.12, "elapsed_time": "0:41:28", "remaining_time": "0:23:12", "throughput": 5704.12, "total_tokens": 14196856} {"current_steps": 21755, "total_steps": 33920, "loss": 0.5122, "lr": 3.4328127821713077e-06, "epoch": 12.827240566037736, "percentage": 64.14, "elapsed_time": "0:41:29", "remaining_time": "0:23:12", "throughput": 5704.08, "total_tokens": 14199736} {"current_steps": 21760, "total_steps": 33920, "loss": 0.301, "lr": 3.430369917650521e-06, "epoch": 12.830188679245284, "percentage": 64.15, "elapsed_time": "0:41:29", "remaining_time": "0:23:11", "throughput": 5704.13, "total_tokens": 14202872} {"current_steps": 21765, "total_steps": 33920, "loss": 0.3869, "lr": 3.427927468696066e-06, "epoch": 12.83313679245283, "percentage": 64.17, "elapsed_time": "0:41:30", "remaining_time": "0:23:10", "throughput": 5704.11, "total_tokens": 14206232} {"current_steps": 21770, "total_steps": 33920, "loss": 0.3546, "lr": 3.425485435954588e-06, "epoch": 12.836084905660378, "percentage": 64.18, "elapsed_time": "0:41:31", "remaining_time": "0:23:10", "throughput": 5704.18, "total_tokens": 14209464} {"current_steps": 21775, "total_steps": 33920, "loss": 0.3767, "lr": 3.4230438200726274e-06, "epoch": 12.839033018867925, "percentage": 64.2, "elapsed_time": "0:41:31", "remaining_time": "0:23:09", "throughput": 5704.25, "total_tokens": 14212920} {"current_steps": 21780, "total_steps": 33920, "loss": 0.356, "lr": 3.4206026216966113e-06, "epoch": 12.841981132075471, "percentage": 64.21, "elapsed_time": "0:41:32", "remaining_time": "0:23:09", "throughput": 5704.16, "total_tokens": 14215480} {"current_steps": 21785, "total_steps": 33920, "loss": 0.4151, "lr": 3.418161841472858e-06, "epoch": 12.84492924528302, "percentage": 64.22, "elapsed_time": "0:41:32", "remaining_time": "0:23:08", "throughput": 5704.14, "total_tokens": 14218488} {"current_steps": 21790, "total_steps": 33920, "loss": 0.316, "lr": 3.4157214800475746e-06, "epoch": 12.847877358490566, "percentage": 64.24, "elapsed_time": "0:41:33", "remaining_time": "0:23:07", "throughput": 5704.12, "total_tokens": 14221752} {"current_steps": 21795, "total_steps": 33920, "loss": 0.2872, "lr": 3.4132815380668577e-06, "epoch": 12.850825471698114, "percentage": 64.25, "elapsed_time": "0:41:33", "remaining_time": "0:23:07", "throughput": 5704.15, "total_tokens": 14224888} {"current_steps": 21800, "total_steps": 33920, "loss": 0.3791, "lr": 3.410842016176691e-06, "epoch": 12.85377358490566, "percentage": 64.27, "elapsed_time": "0:41:34", "remaining_time": "0:23:06", "throughput": 5704.27, "total_tokens": 14228568} {"current_steps": 21805, "total_steps": 33920, "loss": 0.2852, "lr": 3.4084029150229503e-06, "epoch": 12.856721698113208, "percentage": 64.28, "elapsed_time": "0:41:34", "remaining_time": "0:23:06", "throughput": 5704.35, "total_tokens": 14232088} {"current_steps": 21810, "total_steps": 33920, "loss": 0.3437, "lr": 3.4059642352513965e-06, "epoch": 12.859669811320755, "percentage": 64.3, "elapsed_time": "0:41:35", "remaining_time": "0:23:05", "throughput": 5704.34, "total_tokens": 14235448} {"current_steps": 21815, "total_steps": 33920, "loss": 0.3702, "lr": 3.4035259775076813e-06, "epoch": 12.862617924528301, "percentage": 64.31, "elapsed_time": "0:41:36", "remaining_time": "0:23:05", "throughput": 5704.42, "total_tokens": 14238904} {"current_steps": 21820, "total_steps": 33920, "loss": 0.2566, "lr": 3.401088142437344e-06, "epoch": 12.86556603773585, "percentage": 64.33, "elapsed_time": "0:41:36", "remaining_time": "0:23:04", "throughput": 5704.55, "total_tokens": 14242840} {"current_steps": 21825, "total_steps": 33920, "loss": 0.2887, "lr": 3.398650730685813e-06, "epoch": 12.868514150943396, "percentage": 64.34, "elapsed_time": "0:41:37", "remaining_time": "0:23:03", "throughput": 5704.43, "total_tokens": 14245496} {"current_steps": 21830, "total_steps": 33920, "loss": 0.2586, "lr": 3.396213742898401e-06, "epoch": 12.871462264150944, "percentage": 64.36, "elapsed_time": "0:41:37", "remaining_time": "0:23:03", "throughput": 5704.74, "total_tokens": 14250168} {"current_steps": 21835, "total_steps": 33920, "loss": 0.4301, "lr": 3.3937771797203134e-06, "epoch": 12.87441037735849, "percentage": 64.37, "elapsed_time": "0:41:38", "remaining_time": "0:23:02", "throughput": 5704.86, "total_tokens": 14253752} {"current_steps": 21840, "total_steps": 33920, "loss": 0.2607, "lr": 3.391341041796641e-06, "epoch": 12.877358490566039, "percentage": 64.39, "elapsed_time": "0:41:39", "remaining_time": "0:23:02", "throughput": 5704.95, "total_tokens": 14257560} {"current_steps": 21845, "total_steps": 33920, "loss": 0.2537, "lr": 3.3889053297723585e-06, "epoch": 12.880306603773585, "percentage": 64.4, "elapsed_time": "0:41:39", "remaining_time": "0:23:01", "throughput": 5705.12, "total_tokens": 14262008} {"current_steps": 21850, "total_steps": 33920, "loss": 0.288, "lr": 3.3864700442923342e-06, "epoch": 12.883254716981131, "percentage": 64.42, "elapsed_time": "0:41:40", "remaining_time": "0:23:01", "throughput": 5705.28, "total_tokens": 14265560} {"current_steps": 21855, "total_steps": 33920, "loss": 0.3272, "lr": 3.384035186001318e-06, "epoch": 12.88620283018868, "percentage": 64.43, "elapsed_time": "0:41:40", "remaining_time": "0:23:00", "throughput": 5705.16, "total_tokens": 14268536} {"current_steps": 21860, "total_steps": 33920, "loss": 0.309, "lr": 3.381600755543953e-06, "epoch": 12.889150943396226, "percentage": 64.45, "elapsed_time": "0:41:41", "remaining_time": "0:23:00", "throughput": 5704.83, "total_tokens": 14270904} {"current_steps": 21865, "total_steps": 33920, "loss": 0.3665, "lr": 3.3791667535647615e-06, "epoch": 12.892099056603774, "percentage": 64.46, "elapsed_time": "0:41:42", "remaining_time": "0:22:59", "throughput": 5704.84, "total_tokens": 14274232} {"current_steps": 21870, "total_steps": 33920, "loss": 0.3601, "lr": 3.3767331807081584e-06, "epoch": 12.89504716981132, "percentage": 64.48, "elapsed_time": "0:41:42", "remaining_time": "0:22:59", "throughput": 5705.08, "total_tokens": 14278808} {"current_steps": 21875, "total_steps": 33920, "loss": 0.2633, "lr": 3.374300037618442e-06, "epoch": 12.897995283018869, "percentage": 64.49, "elapsed_time": "0:41:43", "remaining_time": "0:22:58", "throughput": 5705.01, "total_tokens": 14281560} {"current_steps": 21880, "total_steps": 33920, "loss": 0.2684, "lr": 3.371867324939796e-06, "epoch": 12.900943396226415, "percentage": 64.5, "elapsed_time": "0:41:43", "remaining_time": "0:22:57", "throughput": 5704.98, "total_tokens": 14284760} {"current_steps": 21885, "total_steps": 33920, "loss": 0.4136, "lr": 3.369435043316293e-06, "epoch": 12.903891509433961, "percentage": 64.52, "elapsed_time": "0:41:44", "remaining_time": "0:22:57", "throughput": 5704.77, "total_tokens": 14287320} {"current_steps": 21890, "total_steps": 33920, "loss": 0.3875, "lr": 3.36700319339189e-06, "epoch": 12.90683962264151, "percentage": 64.53, "elapsed_time": "0:41:45", "remaining_time": "0:22:56", "throughput": 5704.88, "total_tokens": 14290840} {"current_steps": 21895, "total_steps": 33920, "loss": 0.3353, "lr": 3.3645717758104286e-06, "epoch": 12.909787735849056, "percentage": 64.55, "elapsed_time": "0:41:45", "remaining_time": "0:22:56", "throughput": 5705.19, "total_tokens": 14295736} {"current_steps": 21900, "total_steps": 33920, "loss": 0.3002, "lr": 3.3621407912156383e-06, "epoch": 12.912735849056604, "percentage": 64.56, "elapsed_time": "0:41:46", "remaining_time": "0:22:55", "throughput": 5705.21, "total_tokens": 14299000} {"current_steps": 21905, "total_steps": 33920, "loss": 0.3823, "lr": 3.3597102402511326e-06, "epoch": 12.91568396226415, "percentage": 64.58, "elapsed_time": "0:41:46", "remaining_time": "0:22:55", "throughput": 5705.3, "total_tokens": 14302296} {"current_steps": 21910, "total_steps": 33920, "loss": 0.302, "lr": 3.3572801235604093e-06, "epoch": 12.918632075471699, "percentage": 64.59, "elapsed_time": "0:41:47", "remaining_time": "0:22:54", "throughput": 5705.31, "total_tokens": 14305336} {"current_steps": 21915, "total_steps": 33920, "loss": 0.354, "lr": 3.3548504417868538e-06, "epoch": 12.921580188679245, "percentage": 64.61, "elapsed_time": "0:41:47", "remaining_time": "0:22:53", "throughput": 5705.45, "total_tokens": 14309240} {"current_steps": 21920, "total_steps": 33920, "loss": 0.3393, "lr": 3.352421195573734e-06, "epoch": 12.924528301886792, "percentage": 64.62, "elapsed_time": "0:41:48", "remaining_time": "0:22:53", "throughput": 5705.61, "total_tokens": 14313368} {"current_steps": 21925, "total_steps": 33920, "loss": 0.496, "lr": 3.3499923855642026e-06, "epoch": 12.92747641509434, "percentage": 64.64, "elapsed_time": "0:41:49", "remaining_time": "0:22:52", "throughput": 5705.56, "total_tokens": 14316152} {"current_steps": 21930, "total_steps": 33920, "loss": 0.3256, "lr": 3.3475640124012986e-06, "epoch": 12.930424528301886, "percentage": 64.65, "elapsed_time": "0:41:49", "remaining_time": "0:22:52", "throughput": 5705.54, "total_tokens": 14319032} {"current_steps": 21935, "total_steps": 33920, "loss": 0.3823, "lr": 3.345136076727945e-06, "epoch": 12.933372641509434, "percentage": 64.67, "elapsed_time": "0:41:50", "remaining_time": "0:22:51", "throughput": 5705.57, "total_tokens": 14322264} {"current_steps": 21940, "total_steps": 33920, "loss": 0.4122, "lr": 3.3427085791869453e-06, "epoch": 12.93632075471698, "percentage": 64.68, "elapsed_time": "0:41:50", "remaining_time": "0:22:50", "throughput": 5705.64, "total_tokens": 14325528} {"current_steps": 21945, "total_steps": 33920, "loss": 0.3185, "lr": 3.3402815204209926e-06, "epoch": 12.939268867924529, "percentage": 64.7, "elapsed_time": "0:41:51", "remaining_time": "0:22:50", "throughput": 5705.57, "total_tokens": 14328600} {"current_steps": 21950, "total_steps": 33920, "loss": 0.3109, "lr": 3.337854901072659e-06, "epoch": 12.942216981132075, "percentage": 64.71, "elapsed_time": "0:41:51", "remaining_time": "0:22:49", "throughput": 5705.54, "total_tokens": 14331832} {"current_steps": 21955, "total_steps": 33920, "loss": 0.2806, "lr": 3.3354287217844056e-06, "epoch": 12.945165094339622, "percentage": 64.73, "elapsed_time": "0:41:52", "remaining_time": "0:22:49", "throughput": 5705.33, "total_tokens": 14334328} {"current_steps": 21960, "total_steps": 33920, "loss": 0.3336, "lr": 3.3330029831985712e-06, "epoch": 12.94811320754717, "percentage": 64.74, "elapsed_time": "0:41:53", "remaining_time": "0:22:48", "throughput": 5705.25, "total_tokens": 14337816} {"current_steps": 21965, "total_steps": 33920, "loss": 0.3657, "lr": 3.330577685957382e-06, "epoch": 12.951061320754716, "percentage": 64.76, "elapsed_time": "0:41:53", "remaining_time": "0:22:48", "throughput": 5705.13, "total_tokens": 14340536} {"current_steps": 21970, "total_steps": 33920, "loss": 0.3736, "lr": 3.3281528307029454e-06, "epoch": 12.954009433962264, "percentage": 64.77, "elapsed_time": "0:41:54", "remaining_time": "0:22:47", "throughput": 5704.98, "total_tokens": 14343448} {"current_steps": 21975, "total_steps": 33920, "loss": 0.3106, "lr": 3.325728418077251e-06, "epoch": 12.95695754716981, "percentage": 64.78, "elapsed_time": "0:41:54", "remaining_time": "0:22:46", "throughput": 5705.15, "total_tokens": 14347320} {"current_steps": 21980, "total_steps": 33920, "loss": 0.3581, "lr": 3.3233044487221744e-06, "epoch": 12.959905660377359, "percentage": 64.8, "elapsed_time": "0:41:55", "remaining_time": "0:22:46", "throughput": 5705.14, "total_tokens": 14350392} {"current_steps": 21985, "total_steps": 33920, "loss": 0.356, "lr": 3.3208809232794715e-06, "epoch": 12.962853773584905, "percentage": 64.81, "elapsed_time": "0:41:55", "remaining_time": "0:22:45", "throughput": 5705.29, "total_tokens": 14354296} {"current_steps": 21990, "total_steps": 33920, "loss": 0.2802, "lr": 3.3184578423907797e-06, "epoch": 12.965801886792454, "percentage": 64.83, "elapsed_time": "0:41:56", "remaining_time": "0:22:45", "throughput": 5705.31, "total_tokens": 14357688} {"current_steps": 21995, "total_steps": 33920, "loss": 0.4164, "lr": 3.3160352066976224e-06, "epoch": 12.96875, "percentage": 64.84, "elapsed_time": "0:41:57", "remaining_time": "0:22:44", "throughput": 5705.16, "total_tokens": 14360312} {"current_steps": 22000, "total_steps": 33920, "loss": 0.4144, "lr": 3.3136130168414003e-06, "epoch": 12.971698113207546, "percentage": 64.86, "elapsed_time": "0:41:57", "remaining_time": "0:22:44", "throughput": 5705.06, "total_tokens": 14363288} {"current_steps": 22005, "total_steps": 33920, "loss": 0.2744, "lr": 3.311191273463401e-06, "epoch": 12.974646226415095, "percentage": 64.87, "elapsed_time": "0:41:58", "remaining_time": "0:22:43", "throughput": 5705.27, "total_tokens": 14367032} {"current_steps": 22010, "total_steps": 33920, "loss": 0.4209, "lr": 3.3087699772047908e-06, "epoch": 12.977594339622641, "percentage": 64.89, "elapsed_time": "0:41:58", "remaining_time": "0:22:42", "throughput": 5705.24, "total_tokens": 14370296} {"current_steps": 22015, "total_steps": 33920, "loss": 0.4005, "lr": 3.3063491287066164e-06, "epoch": 12.98054245283019, "percentage": 64.9, "elapsed_time": "0:41:59", "remaining_time": "0:22:42", "throughput": 5705.03, "total_tokens": 14372792} {"current_steps": 22020, "total_steps": 33920, "loss": 0.2704, "lr": 3.303928728609811e-06, "epoch": 12.983490566037736, "percentage": 64.92, "elapsed_time": "0:41:59", "remaining_time": "0:22:41", "throughput": 5705.11, "total_tokens": 14375928} {"current_steps": 22025, "total_steps": 33920, "loss": 0.3336, "lr": 3.3015087775551835e-06, "epoch": 12.986438679245284, "percentage": 64.93, "elapsed_time": "0:42:00", "remaining_time": "0:22:41", "throughput": 5705.29, "total_tokens": 14379608} {"current_steps": 22030, "total_steps": 33920, "loss": 0.3712, "lr": 3.299089276183427e-06, "epoch": 12.98938679245283, "percentage": 64.95, "elapsed_time": "0:42:00", "remaining_time": "0:22:40", "throughput": 5705.37, "total_tokens": 14382872} {"current_steps": 22035, "total_steps": 33920, "loss": 0.3521, "lr": 3.2966702251351157e-06, "epoch": 12.992334905660378, "percentage": 64.96, "elapsed_time": "0:42:01", "remaining_time": "0:22:40", "throughput": 5705.4, "total_tokens": 14386136} {"current_steps": 22040, "total_steps": 33920, "loss": 0.3022, "lr": 3.2942516250507035e-06, "epoch": 12.995283018867925, "percentage": 64.98, "elapsed_time": "0:42:02", "remaining_time": "0:22:39", "throughput": 5705.57, "total_tokens": 14389912} {"current_steps": 22045, "total_steps": 33920, "loss": 0.279, "lr": 3.2918334765705227e-06, "epoch": 12.998231132075471, "percentage": 64.99, "elapsed_time": "0:42:02", "remaining_time": "0:22:38", "throughput": 5705.63, "total_tokens": 14393368} {"current_steps": 22050, "total_steps": 33920, "loss": 0.2082, "lr": 3.289415780334792e-06, "epoch": 13.00117924528302, "percentage": 65.01, "elapsed_time": "0:42:03", "remaining_time": "0:22:38", "throughput": 5704.6, "total_tokens": 14396072} {"current_steps": 22055, "total_steps": 33920, "loss": 0.3529, "lr": 3.2869985369836067e-06, "epoch": 13.004127358490566, "percentage": 65.02, "elapsed_time": "0:42:04", "remaining_time": "0:22:37", "throughput": 5704.56, "total_tokens": 14398920} {"current_steps": 22060, "total_steps": 33920, "loss": 0.2676, "lr": 3.2845817471569406e-06, "epoch": 13.007075471698114, "percentage": 65.04, "elapsed_time": "0:42:04", "remaining_time": "0:22:37", "throughput": 5704.8, "total_tokens": 14403080} {"current_steps": 22065, "total_steps": 33920, "loss": 0.351, "lr": 3.28216541149465e-06, "epoch": 13.01002358490566, "percentage": 65.05, "elapsed_time": "0:42:05", "remaining_time": "0:22:36", "throughput": 5705.02, "total_tokens": 14407176} {"current_steps": 22070, "total_steps": 33920, "loss": 0.2045, "lr": 3.2797495306364707e-06, "epoch": 13.012971698113208, "percentage": 65.06, "elapsed_time": "0:42:05", "remaining_time": "0:22:36", "throughput": 5704.92, "total_tokens": 14409864} {"current_steps": 22075, "total_steps": 33920, "loss": 0.442, "lr": 3.2773341052220174e-06, "epoch": 13.015919811320755, "percentage": 65.08, "elapsed_time": "0:42:06", "remaining_time": "0:22:35", "throughput": 5704.96, "total_tokens": 14413384} {"current_steps": 22080, "total_steps": 33920, "loss": 0.449, "lr": 3.274919135890783e-06, "epoch": 13.018867924528301, "percentage": 65.09, "elapsed_time": "0:42:06", "remaining_time": "0:22:35", "throughput": 5704.76, "total_tokens": 14415912} {"current_steps": 22085, "total_steps": 33920, "loss": 0.2272, "lr": 3.2725046232821424e-06, "epoch": 13.02181603773585, "percentage": 65.11, "elapsed_time": "0:42:07", "remaining_time": "0:22:34", "throughput": 5704.65, "total_tokens": 14418792} {"current_steps": 22090, "total_steps": 33920, "loss": 0.4411, "lr": 3.270090568035348e-06, "epoch": 13.024764150943396, "percentage": 65.12, "elapsed_time": "0:42:08", "remaining_time": "0:22:33", "throughput": 5704.62, "total_tokens": 14421960} {"current_steps": 22095, "total_steps": 33920, "loss": 0.3193, "lr": 3.2676769707895306e-06, "epoch": 13.027712264150944, "percentage": 65.14, "elapsed_time": "0:42:08", "remaining_time": "0:22:33", "throughput": 5704.61, "total_tokens": 14425000} {"current_steps": 22100, "total_steps": 33920, "loss": 0.385, "lr": 3.2652638321837015e-06, "epoch": 13.03066037735849, "percentage": 65.15, "elapsed_time": "0:42:09", "remaining_time": "0:22:32", "throughput": 5704.8, "total_tokens": 14429576} {"current_steps": 22105, "total_steps": 33920, "loss": 0.3257, "lr": 3.2628511528567497e-06, "epoch": 13.033608490566039, "percentage": 65.17, "elapsed_time": "0:42:09", "remaining_time": "0:22:32", "throughput": 5704.66, "total_tokens": 14432168} {"current_steps": 22110, "total_steps": 33920, "loss": 0.3248, "lr": 3.2604389334474407e-06, "epoch": 13.036556603773585, "percentage": 65.18, "elapsed_time": "0:42:10", "remaining_time": "0:22:31", "throughput": 5704.8, "total_tokens": 14435848} {"current_steps": 22115, "total_steps": 33920, "loss": 0.412, "lr": 3.2580271745944224e-06, "epoch": 13.039504716981131, "percentage": 65.2, "elapsed_time": "0:42:11", "remaining_time": "0:22:31", "throughput": 5704.88, "total_tokens": 14439336} {"current_steps": 22120, "total_steps": 33920, "loss": 0.2168, "lr": 3.255615876936217e-06, "epoch": 13.04245283018868, "percentage": 65.21, "elapsed_time": "0:42:11", "remaining_time": "0:22:30", "throughput": 5704.95, "total_tokens": 14442568} {"current_steps": 22125, "total_steps": 33920, "loss": 0.2555, "lr": 3.2532050411112248e-06, "epoch": 13.045400943396226, "percentage": 65.23, "elapsed_time": "0:42:12", "remaining_time": "0:22:29", "throughput": 5704.95, "total_tokens": 14445736} {"current_steps": 22130, "total_steps": 33920, "loss": 0.2493, "lr": 3.2507946677577274e-06, "epoch": 13.048349056603774, "percentage": 65.24, "elapsed_time": "0:42:12", "remaining_time": "0:22:29", "throughput": 5705.15, "total_tokens": 14450152} {"current_steps": 22135, "total_steps": 33920, "loss": 0.3562, "lr": 3.2483847575138807e-06, "epoch": 13.05129716981132, "percentage": 65.26, "elapsed_time": "0:42:13", "remaining_time": "0:22:28", "throughput": 5705.22, "total_tokens": 14453672} {"current_steps": 22140, "total_steps": 33920, "loss": 0.3402, "lr": 3.245975311017716e-06, "epoch": 13.054245283018869, "percentage": 65.27, "elapsed_time": "0:42:13", "remaining_time": "0:22:28", "throughput": 5705.24, "total_tokens": 14456872} {"current_steps": 22145, "total_steps": 33920, "loss": 0.3406, "lr": 3.2435663289071486e-06, "epoch": 13.057193396226415, "percentage": 65.29, "elapsed_time": "0:42:14", "remaining_time": "0:22:27", "throughput": 5705.27, "total_tokens": 14460296} {"current_steps": 22150, "total_steps": 33920, "loss": 0.3162, "lr": 3.241157811819966e-06, "epoch": 13.060141509433961, "percentage": 65.3, "elapsed_time": "0:42:15", "remaining_time": "0:22:27", "throughput": 5705.14, "total_tokens": 14463048} {"current_steps": 22155, "total_steps": 33920, "loss": 0.3425, "lr": 3.2387497603938327e-06, "epoch": 13.06308962264151, "percentage": 65.32, "elapsed_time": "0:42:15", "remaining_time": "0:22:26", "throughput": 5705.13, "total_tokens": 14465864} {"current_steps": 22160, "total_steps": 33920, "loss": 0.4108, "lr": 3.2363421752662903e-06, "epoch": 13.066037735849056, "percentage": 65.33, "elapsed_time": "0:42:16", "remaining_time": "0:22:25", "throughput": 5705.08, "total_tokens": 14468744} {"current_steps": 22165, "total_steps": 33920, "loss": 0.2618, "lr": 3.233935057074759e-06, "epoch": 13.068985849056604, "percentage": 65.34, "elapsed_time": "0:42:16", "remaining_time": "0:22:25", "throughput": 5705.26, "total_tokens": 14472360} {"current_steps": 22170, "total_steps": 33920, "loss": 0.3395, "lr": 3.2315284064565324e-06, "epoch": 13.07193396226415, "percentage": 65.36, "elapsed_time": "0:42:17", "remaining_time": "0:22:24", "throughput": 5705.14, "total_tokens": 14474824} {"current_steps": 22175, "total_steps": 33920, "loss": 0.2309, "lr": 3.2291222240487813e-06, "epoch": 13.074882075471699, "percentage": 65.37, "elapsed_time": "0:42:17", "remaining_time": "0:22:24", "throughput": 5705.06, "total_tokens": 14477544} {"current_steps": 22180, "total_steps": 33920, "loss": 0.3505, "lr": 3.226716510488554e-06, "epoch": 13.077830188679245, "percentage": 65.39, "elapsed_time": "0:42:18", "remaining_time": "0:22:23", "throughput": 5705.19, "total_tokens": 14481224} {"current_steps": 22185, "total_steps": 33920, "loss": 0.3061, "lr": 3.224311266412773e-06, "epoch": 13.080778301886792, "percentage": 65.4, "elapsed_time": "0:42:18", "remaining_time": "0:22:22", "throughput": 5704.98, "total_tokens": 14483688} {"current_steps": 22190, "total_steps": 33920, "loss": 0.337, "lr": 3.2219064924582366e-06, "epoch": 13.08372641509434, "percentage": 65.42, "elapsed_time": "0:42:19", "remaining_time": "0:22:22", "throughput": 5705.0, "total_tokens": 14487112} {"current_steps": 22195, "total_steps": 33920, "loss": 0.3797, "lr": 3.2195021892616197e-06, "epoch": 13.086674528301886, "percentage": 65.43, "elapsed_time": "0:42:20", "remaining_time": "0:22:21", "throughput": 5705.26, "total_tokens": 14492104} {"current_steps": 22200, "total_steps": 33920, "loss": 0.3244, "lr": 3.217098357459472e-06, "epoch": 13.089622641509434, "percentage": 65.45, "elapsed_time": "0:42:20", "remaining_time": "0:22:21", "throughput": 5705.43, "total_tokens": 14496040} {"current_steps": 22205, "total_steps": 33920, "loss": 0.4146, "lr": 3.214694997688217e-06, "epoch": 13.09257075471698, "percentage": 65.46, "elapsed_time": "0:42:21", "remaining_time": "0:22:20", "throughput": 5705.38, "total_tokens": 14499432} {"current_steps": 22210, "total_steps": 33920, "loss": 0.3313, "lr": 3.2122921105841572e-06, "epoch": 13.095518867924529, "percentage": 65.48, "elapsed_time": "0:42:21", "remaining_time": "0:22:20", "throughput": 5705.43, "total_tokens": 14502664} {"current_steps": 22215, "total_steps": 33920, "loss": 0.4458, "lr": 3.2098896967834647e-06, "epoch": 13.098466981132075, "percentage": 65.49, "elapsed_time": "0:42:22", "remaining_time": "0:22:19", "throughput": 5705.59, "total_tokens": 14506440} {"current_steps": 22220, "total_steps": 33920, "loss": 0.284, "lr": 3.2074877569221896e-06, "epoch": 13.101415094339623, "percentage": 65.51, "elapsed_time": "0:42:23", "remaining_time": "0:22:19", "throughput": 5705.48, "total_tokens": 14509160} {"current_steps": 22225, "total_steps": 33920, "loss": 0.413, "lr": 3.205086291636257e-06, "epoch": 13.10436320754717, "percentage": 65.52, "elapsed_time": "0:42:23", "remaining_time": "0:22:18", "throughput": 5705.57, "total_tokens": 14512520} {"current_steps": 22230, "total_steps": 33920, "loss": 0.5629, "lr": 3.202685301561463e-06, "epoch": 13.107311320754716, "percentage": 65.54, "elapsed_time": "0:42:24", "remaining_time": "0:22:17", "throughput": 5705.83, "total_tokens": 14517096} {"current_steps": 22235, "total_steps": 33920, "loss": 0.2871, "lr": 3.200284787333482e-06, "epoch": 13.110259433962264, "percentage": 65.55, "elapsed_time": "0:42:24", "remaining_time": "0:22:17", "throughput": 5705.83, "total_tokens": 14519912} {"current_steps": 22240, "total_steps": 33920, "loss": 0.2783, "lr": 3.1978847495878595e-06, "epoch": 13.11320754716981, "percentage": 65.57, "elapsed_time": "0:42:25", "remaining_time": "0:22:16", "throughput": 5705.98, "total_tokens": 14524680} {"current_steps": 22245, "total_steps": 33920, "loss": 0.3445, "lr": 3.1954851889600176e-06, "epoch": 13.116155660377359, "percentage": 65.58, "elapsed_time": "0:42:26", "remaining_time": "0:22:16", "throughput": 5706.0, "total_tokens": 14527912} {"current_steps": 22250, "total_steps": 33920, "loss": 0.2862, "lr": 3.1930861060852485e-06, "epoch": 13.119103773584905, "percentage": 65.6, "elapsed_time": "0:42:26", "remaining_time": "0:22:15", "throughput": 5706.0, "total_tokens": 14531080} {"current_steps": 22255, "total_steps": 33920, "loss": 0.3712, "lr": 3.1906875015987194e-06, "epoch": 13.122051886792454, "percentage": 65.61, "elapsed_time": "0:42:27", "remaining_time": "0:22:15", "throughput": 5706.1, "total_tokens": 14534504} {"current_steps": 22260, "total_steps": 33920, "loss": 0.304, "lr": 3.188289376135473e-06, "epoch": 13.125, "percentage": 65.62, "elapsed_time": "0:42:27", "remaining_time": "0:22:14", "throughput": 5706.27, "total_tokens": 14538056} {"current_steps": 22265, "total_steps": 33920, "loss": 0.3575, "lr": 3.1858917303304213e-06, "epoch": 13.127948113207546, "percentage": 65.64, "elapsed_time": "0:42:28", "remaining_time": "0:22:13", "throughput": 5706.24, "total_tokens": 14540968} {"current_steps": 22270, "total_steps": 33920, "loss": 0.2763, "lr": 3.1834945648183535e-06, "epoch": 13.130896226415095, "percentage": 65.65, "elapsed_time": "0:42:28", "remaining_time": "0:22:13", "throughput": 5706.36, "total_tokens": 14544520} {"current_steps": 22275, "total_steps": 33920, "loss": 0.3363, "lr": 3.1810978802339283e-06, "epoch": 13.133844339622641, "percentage": 65.67, "elapsed_time": "0:42:29", "remaining_time": "0:22:12", "throughput": 5706.23, "total_tokens": 14547176} {"current_steps": 22280, "total_steps": 33920, "loss": 0.3015, "lr": 3.1787016772116767e-06, "epoch": 13.13679245283019, "percentage": 65.68, "elapsed_time": "0:42:30", "remaining_time": "0:22:12", "throughput": 5706.65, "total_tokens": 14552840} {"current_steps": 22285, "total_steps": 33920, "loss": 0.3367, "lr": 3.1763059563860073e-06, "epoch": 13.139740566037736, "percentage": 65.7, "elapsed_time": "0:42:30", "remaining_time": "0:22:11", "throughput": 5706.72, "total_tokens": 14555752} {"current_steps": 22290, "total_steps": 33920, "loss": 0.4115, "lr": 3.1739107183911953e-06, "epoch": 13.142688679245284, "percentage": 65.71, "elapsed_time": "0:42:31", "remaining_time": "0:22:11", "throughput": 5706.79, "total_tokens": 14558952} {"current_steps": 22295, "total_steps": 33920, "loss": 0.382, "lr": 3.1715159638613898e-06, "epoch": 13.14563679245283, "percentage": 65.73, "elapsed_time": "0:42:31", "remaining_time": "0:22:10", "throughput": 5707.11, "total_tokens": 14563560} {"current_steps": 22300, "total_steps": 33920, "loss": 0.3265, "lr": 3.1691216934306134e-06, "epoch": 13.148584905660377, "percentage": 65.74, "elapsed_time": "0:42:32", "remaining_time": "0:22:09", "throughput": 5707.26, "total_tokens": 14566984} {"current_steps": 22305, "total_steps": 33920, "loss": 0.2904, "lr": 3.16672790773276e-06, "epoch": 13.151533018867925, "percentage": 65.76, "elapsed_time": "0:42:32", "remaining_time": "0:22:09", "throughput": 5707.22, "total_tokens": 14569992} {"current_steps": 22310, "total_steps": 33920, "loss": 0.2653, "lr": 3.164334607401593e-06, "epoch": 13.154481132075471, "percentage": 65.77, "elapsed_time": "0:42:33", "remaining_time": "0:22:08", "throughput": 5707.3, "total_tokens": 14573544} {"current_steps": 22315, "total_steps": 33920, "loss": 0.3992, "lr": 3.1619417930707506e-06, "epoch": 13.15742924528302, "percentage": 65.79, "elapsed_time": "0:42:34", "remaining_time": "0:22:08", "throughput": 5707.3, "total_tokens": 14576584} {"current_steps": 22320, "total_steps": 33920, "loss": 0.3906, "lr": 3.1595494653737408e-06, "epoch": 13.160377358490566, "percentage": 65.8, "elapsed_time": "0:42:34", "remaining_time": "0:22:07", "throughput": 5707.32, "total_tokens": 14579624} {"current_steps": 22325, "total_steps": 33920, "loss": 0.4239, "lr": 3.1571576249439408e-06, "epoch": 13.163325471698114, "percentage": 65.82, "elapsed_time": "0:42:35", "remaining_time": "0:22:07", "throughput": 5707.48, "total_tokens": 14583304} {"current_steps": 22330, "total_steps": 33920, "loss": 0.2929, "lr": 3.1547662724146e-06, "epoch": 13.16627358490566, "percentage": 65.83, "elapsed_time": "0:42:35", "remaining_time": "0:22:06", "throughput": 5707.48, "total_tokens": 14586120} {"current_steps": 22335, "total_steps": 33920, "loss": 0.2204, "lr": 3.1523754084188436e-06, "epoch": 13.169221698113208, "percentage": 65.85, "elapsed_time": "0:42:36", "remaining_time": "0:22:05", "throughput": 5707.55, "total_tokens": 14589544} {"current_steps": 22340, "total_steps": 33920, "loss": 0.3502, "lr": 3.149985033589661e-06, "epoch": 13.172169811320755, "percentage": 65.86, "elapsed_time": "0:42:36", "remaining_time": "0:22:05", "throughput": 5707.77, "total_tokens": 14593576} {"current_steps": 22345, "total_steps": 33920, "loss": 0.4278, "lr": 3.147595148559912e-06, "epoch": 13.175117924528301, "percentage": 65.88, "elapsed_time": "0:42:37", "remaining_time": "0:22:04", "throughput": 5707.59, "total_tokens": 14595976} {"current_steps": 22350, "total_steps": 33920, "loss": 0.2835, "lr": 3.1452057539623328e-06, "epoch": 13.17806603773585, "percentage": 65.89, "elapsed_time": "0:42:37", "remaining_time": "0:22:04", "throughput": 5707.81, "total_tokens": 14600200} {"current_steps": 22355, "total_steps": 33920, "loss": 0.342, "lr": 3.142816850429523e-06, "epoch": 13.181014150943396, "percentage": 65.91, "elapsed_time": "0:42:38", "remaining_time": "0:22:03", "throughput": 5707.94, "total_tokens": 14603400} {"current_steps": 22360, "total_steps": 33920, "loss": 0.3212, "lr": 3.1404284385939552e-06, "epoch": 13.183962264150944, "percentage": 65.92, "elapsed_time": "0:42:38", "remaining_time": "0:22:02", "throughput": 5707.86, "total_tokens": 14606280} {"current_steps": 22365, "total_steps": 33920, "loss": 0.364, "lr": 3.138040519087975e-06, "epoch": 13.18691037735849, "percentage": 65.93, "elapsed_time": "0:42:39", "remaining_time": "0:22:02", "throughput": 5707.79, "total_tokens": 14609224} {"current_steps": 22370, "total_steps": 33920, "loss": 0.3287, "lr": 3.13565309254379e-06, "epoch": 13.189858490566039, "percentage": 65.95, "elapsed_time": "0:42:40", "remaining_time": "0:22:01", "throughput": 5707.65, "total_tokens": 14612008} {"current_steps": 22375, "total_steps": 33920, "loss": 0.3505, "lr": 3.1332661595934845e-06, "epoch": 13.192806603773585, "percentage": 65.96, "elapsed_time": "0:42:40", "remaining_time": "0:22:01", "throughput": 5707.6, "total_tokens": 14614888} {"current_steps": 22380, "total_steps": 33920, "loss": 0.4883, "lr": 3.130879720869008e-06, "epoch": 13.195754716981131, "percentage": 65.98, "elapsed_time": "0:42:41", "remaining_time": "0:22:00", "throughput": 5707.59, "total_tokens": 14617960} {"current_steps": 22385, "total_steps": 33920, "loss": 0.2341, "lr": 3.1284937770021815e-06, "epoch": 13.19870283018868, "percentage": 65.99, "elapsed_time": "0:42:41", "remaining_time": "0:22:00", "throughput": 5707.54, "total_tokens": 14620776} {"current_steps": 22390, "total_steps": 33920, "loss": 0.3882, "lr": 3.1261083286246916e-06, "epoch": 13.201650943396226, "percentage": 66.01, "elapsed_time": "0:42:42", "remaining_time": "0:21:59", "throughput": 5707.74, "total_tokens": 14624392} {"current_steps": 22395, "total_steps": 33920, "loss": 0.2625, "lr": 3.1237233763680997e-06, "epoch": 13.204599056603774, "percentage": 66.02, "elapsed_time": "0:42:42", "remaining_time": "0:21:58", "throughput": 5707.95, "total_tokens": 14628136} {"current_steps": 22400, "total_steps": 33920, "loss": 0.2881, "lr": 3.1213389208638303e-06, "epoch": 13.20754716981132, "percentage": 66.04, "elapsed_time": "0:42:43", "remaining_time": "0:21:58", "throughput": 5708.18, "total_tokens": 14632264} {"current_steps": 22405, "total_steps": 33920, "loss": 0.3104, "lr": 3.1189549627431757e-06, "epoch": 13.210495283018869, "percentage": 66.05, "elapsed_time": "0:42:43", "remaining_time": "0:21:57", "throughput": 5708.04, "total_tokens": 14634952} {"current_steps": 22410, "total_steps": 33920, "loss": 0.1907, "lr": 3.116571502637304e-06, "epoch": 13.213443396226415, "percentage": 66.07, "elapsed_time": "0:42:44", "remaining_time": "0:21:57", "throughput": 5707.96, "total_tokens": 14637864} {"current_steps": 22415, "total_steps": 33920, "loss": 0.3162, "lr": 3.1141885411772434e-06, "epoch": 13.216391509433961, "percentage": 66.08, "elapsed_time": "0:42:44", "remaining_time": "0:21:56", "throughput": 5707.78, "total_tokens": 14640296} {"current_steps": 22420, "total_steps": 33920, "loss": 0.2773, "lr": 3.111806078993893e-06, "epoch": 13.21933962264151, "percentage": 66.1, "elapsed_time": "0:42:45", "remaining_time": "0:21:55", "throughput": 5707.91, "total_tokens": 14643688} {"current_steps": 22425, "total_steps": 33920, "loss": 0.4029, "lr": 3.1094241167180223e-06, "epoch": 13.222287735849056, "percentage": 66.11, "elapsed_time": "0:42:46", "remaining_time": "0:21:55", "throughput": 5707.82, "total_tokens": 14646280} {"current_steps": 22430, "total_steps": 33920, "loss": 0.3263, "lr": 3.1070426549802623e-06, "epoch": 13.225235849056604, "percentage": 66.13, "elapsed_time": "0:42:46", "remaining_time": "0:21:54", "throughput": 5707.96, "total_tokens": 14650184} {"current_steps": 22435, "total_steps": 33920, "loss": 0.3968, "lr": 3.1046616944111196e-06, "epoch": 13.22818396226415, "percentage": 66.14, "elapsed_time": "0:42:47", "remaining_time": "0:21:54", "throughput": 5708.21, "total_tokens": 14654152} {"current_steps": 22440, "total_steps": 33920, "loss": 0.3581, "lr": 3.1022812356409606e-06, "epoch": 13.231132075471699, "percentage": 66.16, "elapsed_time": "0:42:47", "remaining_time": "0:21:53", "throughput": 5708.12, "total_tokens": 14656712} {"current_steps": 22445, "total_steps": 33920, "loss": 0.3072, "lr": 3.0999012793000244e-06, "epoch": 13.234080188679245, "percentage": 66.17, "elapsed_time": "0:42:48", "remaining_time": "0:21:53", "throughput": 5708.19, "total_tokens": 14659880} {"current_steps": 22450, "total_steps": 33920, "loss": 0.2346, "lr": 3.097521826018414e-06, "epoch": 13.237028301886792, "percentage": 66.19, "elapsed_time": "0:42:48", "remaining_time": "0:21:52", "throughput": 5708.4, "total_tokens": 14663752} {"current_steps": 22455, "total_steps": 33920, "loss": 0.4994, "lr": 3.0951428764260973e-06, "epoch": 13.23997641509434, "percentage": 66.2, "elapsed_time": "0:42:49", "remaining_time": "0:21:51", "throughput": 5708.49, "total_tokens": 14666984} {"current_steps": 22460, "total_steps": 33920, "loss": 0.3028, "lr": 3.092764431152915e-06, "epoch": 13.242924528301886, "percentage": 66.21, "elapsed_time": "0:42:49", "remaining_time": "0:21:51", "throughput": 5708.53, "total_tokens": 14669896} {"current_steps": 22465, "total_steps": 33920, "loss": 0.2516, "lr": 3.0903864908285693e-06, "epoch": 13.245872641509434, "percentage": 66.23, "elapsed_time": "0:42:50", "remaining_time": "0:21:50", "throughput": 5708.68, "total_tokens": 14673704} {"current_steps": 22470, "total_steps": 33920, "loss": 0.3128, "lr": 3.088009056082629e-06, "epoch": 13.24882075471698, "percentage": 66.24, "elapsed_time": "0:42:50", "remaining_time": "0:21:50", "throughput": 5708.69, "total_tokens": 14676680} {"current_steps": 22475, "total_steps": 33920, "loss": 0.3558, "lr": 3.0856321275445324e-06, "epoch": 13.251768867924529, "percentage": 66.26, "elapsed_time": "0:42:51", "remaining_time": "0:21:49", "throughput": 5708.71, "total_tokens": 14679656} {"current_steps": 22480, "total_steps": 33920, "loss": 0.4397, "lr": 3.0832557058435808e-06, "epoch": 13.254716981132075, "percentage": 66.27, "elapsed_time": "0:42:51", "remaining_time": "0:21:48", "throughput": 5708.48, "total_tokens": 14681736} {"current_steps": 22485, "total_steps": 33920, "loss": 0.3563, "lr": 3.0808797916089405e-06, "epoch": 13.257665094339623, "percentage": 66.29, "elapsed_time": "0:42:52", "remaining_time": "0:21:48", "throughput": 5708.63, "total_tokens": 14685256} {"current_steps": 22490, "total_steps": 33920, "loss": 0.3046, "lr": 3.078504385469647e-06, "epoch": 13.26061320754717, "percentage": 66.3, "elapsed_time": "0:42:53", "remaining_time": "0:21:47", "throughput": 5708.77, "total_tokens": 14688776} {"current_steps": 22495, "total_steps": 33920, "loss": 0.3171, "lr": 3.076129488054599e-06, "epoch": 13.263561320754716, "percentage": 66.32, "elapsed_time": "0:42:53", "remaining_time": "0:21:47", "throughput": 5708.79, "total_tokens": 14691720} {"current_steps": 22500, "total_steps": 33920, "loss": 0.3176, "lr": 3.0737550999925604e-06, "epoch": 13.266509433962264, "percentage": 66.33, "elapsed_time": "0:42:54", "remaining_time": "0:21:46", "throughput": 5708.71, "total_tokens": 14694376} {"current_steps": 22505, "total_steps": 33920, "loss": 0.3899, "lr": 3.0713812219121604e-06, "epoch": 13.26945754716981, "percentage": 66.35, "elapsed_time": "0:42:54", "remaining_time": "0:21:45", "throughput": 5708.79, "total_tokens": 14698376} {"current_steps": 22510, "total_steps": 33920, "loss": 0.3128, "lr": 3.0690078544418934e-06, "epoch": 13.272405660377359, "percentage": 66.36, "elapsed_time": "0:42:55", "remaining_time": "0:21:45", "throughput": 5708.83, "total_tokens": 14701704} {"current_steps": 22515, "total_steps": 33920, "loss": 0.4028, "lr": 3.0666349982101198e-06, "epoch": 13.275353773584905, "percentage": 66.38, "elapsed_time": "0:42:55", "remaining_time": "0:21:44", "throughput": 5708.9, "total_tokens": 14704936} {"current_steps": 22520, "total_steps": 33920, "loss": 0.3548, "lr": 3.0642626538450627e-06, "epoch": 13.278301886792454, "percentage": 66.39, "elapsed_time": "0:42:56", "remaining_time": "0:21:44", "throughput": 5708.95, "total_tokens": 14707976} {"current_steps": 22525, "total_steps": 33920, "loss": 0.4021, "lr": 3.061890821974809e-06, "epoch": 13.28125, "percentage": 66.41, "elapsed_time": "0:42:56", "remaining_time": "0:21:43", "throughput": 5708.87, "total_tokens": 14710728} {"current_steps": 22530, "total_steps": 33920, "loss": 0.361, "lr": 3.059519503227313e-06, "epoch": 13.284198113207546, "percentage": 66.42, "elapsed_time": "0:42:57", "remaining_time": "0:21:43", "throughput": 5709.03, "total_tokens": 14714472} {"current_steps": 22535, "total_steps": 33920, "loss": 0.2191, "lr": 3.057148698230393e-06, "epoch": 13.287146226415095, "percentage": 66.44, "elapsed_time": "0:42:57", "remaining_time": "0:21:42", "throughput": 5708.89, "total_tokens": 14716840} {"current_steps": 22540, "total_steps": 33920, "loss": 0.3205, "lr": 3.0547784076117294e-06, "epoch": 13.290094339622641, "percentage": 66.45, "elapsed_time": "0:42:58", "remaining_time": "0:21:41", "throughput": 5708.8, "total_tokens": 14719336} {"current_steps": 22545, "total_steps": 33920, "loss": 0.3142, "lr": 3.0524086319988635e-06, "epoch": 13.29304245283019, "percentage": 66.47, "elapsed_time": "0:42:58", "remaining_time": "0:21:41", "throughput": 5708.67, "total_tokens": 14721896} {"current_steps": 22550, "total_steps": 33920, "loss": 0.2795, "lr": 3.0500393720192074e-06, "epoch": 13.295990566037736, "percentage": 66.48, "elapsed_time": "0:42:59", "remaining_time": "0:21:40", "throughput": 5708.91, "total_tokens": 14725800} {"current_steps": 22555, "total_steps": 33920, "loss": 0.4061, "lr": 3.047670628300031e-06, "epoch": 13.298938679245284, "percentage": 66.49, "elapsed_time": "0:43:00", "remaining_time": "0:21:40", "throughput": 5709.0, "total_tokens": 14729480} {"current_steps": 22560, "total_steps": 33920, "loss": 0.2783, "lr": 3.0453024014684694e-06, "epoch": 13.30188679245283, "percentage": 66.51, "elapsed_time": "0:43:00", "remaining_time": "0:21:39", "throughput": 5709.11, "total_tokens": 14732680} {"current_steps": 22565, "total_steps": 33920, "loss": 0.3391, "lr": 3.0429346921515225e-06, "epoch": 13.304834905660377, "percentage": 66.52, "elapsed_time": "0:43:01", "remaining_time": "0:21:38", "throughput": 5709.17, "total_tokens": 14736488} {"current_steps": 22570, "total_steps": 33920, "loss": 0.3137, "lr": 3.04056750097605e-06, "epoch": 13.307783018867925, "percentage": 66.54, "elapsed_time": "0:43:01", "remaining_time": "0:21:38", "throughput": 5709.35, "total_tokens": 14739976} {"current_steps": 22575, "total_steps": 33920, "loss": 0.2779, "lr": 3.0382008285687754e-06, "epoch": 13.310731132075471, "percentage": 66.55, "elapsed_time": "0:43:02", "remaining_time": "0:21:37", "throughput": 5709.34, "total_tokens": 14742792} {"current_steps": 22580, "total_steps": 33920, "loss": 0.325, "lr": 3.035834675556287e-06, "epoch": 13.31367924528302, "percentage": 66.57, "elapsed_time": "0:43:02", "remaining_time": "0:21:37", "throughput": 5709.53, "total_tokens": 14746824} {"current_steps": 22585, "total_steps": 33920, "loss": 0.2529, "lr": 3.0334690425650336e-06, "epoch": 13.316627358490566, "percentage": 66.58, "elapsed_time": "0:43:03", "remaining_time": "0:21:36", "throughput": 5709.66, "total_tokens": 14750408} {"current_steps": 22590, "total_steps": 33920, "loss": 0.3458, "lr": 3.031103930221325e-06, "epoch": 13.319575471698114, "percentage": 66.6, "elapsed_time": "0:43:03", "remaining_time": "0:21:35", "throughput": 5709.69, "total_tokens": 14753352} {"current_steps": 22595, "total_steps": 33920, "loss": 0.2599, "lr": 3.028739339151338e-06, "epoch": 13.32252358490566, "percentage": 66.61, "elapsed_time": "0:43:04", "remaining_time": "0:21:35", "throughput": 5709.73, "total_tokens": 14756264} {"current_steps": 22600, "total_steps": 33920, "loss": 0.3395, "lr": 3.0263752699811067e-06, "epoch": 13.325471698113208, "percentage": 66.63, "elapsed_time": "0:43:04", "remaining_time": "0:21:34", "throughput": 5709.75, "total_tokens": 14759048} {"current_steps": 22605, "total_steps": 33920, "loss": 0.2788, "lr": 3.0240117233365267e-06, "epoch": 13.328419811320755, "percentage": 66.64, "elapsed_time": "0:43:05", "remaining_time": "0:21:34", "throughput": 5709.84, "total_tokens": 14762248} {"current_steps": 22610, "total_steps": 33920, "loss": 0.2963, "lr": 3.0216486998433604e-06, "epoch": 13.331367924528301, "percentage": 66.66, "elapsed_time": "0:43:05", "remaining_time": "0:21:33", "throughput": 5709.96, "total_tokens": 14765544} {"current_steps": 22615, "total_steps": 33920, "loss": 0.2308, "lr": 3.0192862001272273e-06, "epoch": 13.33431603773585, "percentage": 66.67, "elapsed_time": "0:43:06", "remaining_time": "0:21:32", "throughput": 5710.03, "total_tokens": 14768584} {"current_steps": 22620, "total_steps": 33920, "loss": 0.3515, "lr": 3.0169242248136066e-06, "epoch": 13.337264150943396, "percentage": 66.69, "elapsed_time": "0:43:06", "remaining_time": "0:21:32", "throughput": 5710.08, "total_tokens": 14771496} {"current_steps": 22625, "total_steps": 33920, "loss": 0.3583, "lr": 3.0145627745278457e-06, "epoch": 13.340212264150944, "percentage": 66.7, "elapsed_time": "0:43:07", "remaining_time": "0:21:31", "throughput": 5710.21, "total_tokens": 14775016} {"current_steps": 22630, "total_steps": 33920, "loss": 0.4992, "lr": 3.0122018498951478e-06, "epoch": 13.34316037735849, "percentage": 66.72, "elapsed_time": "0:43:08", "remaining_time": "0:21:31", "throughput": 5710.56, "total_tokens": 14781096} {"current_steps": 22635, "total_steps": 33920, "loss": 0.307, "lr": 3.0098414515405765e-06, "epoch": 13.346108490566039, "percentage": 66.73, "elapsed_time": "0:43:08", "remaining_time": "0:21:30", "throughput": 5710.45, "total_tokens": 14783528} {"current_steps": 22640, "total_steps": 33920, "loss": 0.3143, "lr": 3.0074815800890576e-06, "epoch": 13.349056603773585, "percentage": 66.75, "elapsed_time": "0:43:09", "remaining_time": "0:21:30", "throughput": 5710.49, "total_tokens": 14786728} {"current_steps": 22645, "total_steps": 33920, "loss": 0.3502, "lr": 3.005122236165378e-06, "epoch": 13.352004716981131, "percentage": 66.76, "elapsed_time": "0:43:09", "remaining_time": "0:21:29", "throughput": 5710.44, "total_tokens": 14789480} {"current_steps": 22650, "total_steps": 33920, "loss": 0.2423, "lr": 3.0027634203941847e-06, "epoch": 13.35495283018868, "percentage": 66.77, "elapsed_time": "0:43:10", "remaining_time": "0:21:28", "throughput": 5710.51, "total_tokens": 14792488} {"current_steps": 22655, "total_steps": 33920, "loss": 0.3403, "lr": 3.0004051333999816e-06, "epoch": 13.357900943396226, "percentage": 66.79, "elapsed_time": "0:43:10", "remaining_time": "0:21:28", "throughput": 5710.52, "total_tokens": 14795368} {"current_steps": 22660, "total_steps": 33920, "loss": 0.3229, "lr": 2.998047375807139e-06, "epoch": 13.360849056603774, "percentage": 66.8, "elapsed_time": "0:43:11", "remaining_time": "0:21:27", "throughput": 5710.62, "total_tokens": 14799112} {"current_steps": 22665, "total_steps": 33920, "loss": 0.2957, "lr": 2.995690148239881e-06, "epoch": 13.36379716981132, "percentage": 66.82, "elapsed_time": "0:43:12", "remaining_time": "0:21:27", "throughput": 5710.81, "total_tokens": 14802920} {"current_steps": 22670, "total_steps": 33920, "loss": 0.2759, "lr": 2.993333451322293e-06, "epoch": 13.366745283018869, "percentage": 66.83, "elapsed_time": "0:43:12", "remaining_time": "0:21:26", "throughput": 5710.83, "total_tokens": 14805704} {"current_steps": 22675, "total_steps": 33920, "loss": 0.3963, "lr": 2.9909772856783242e-06, "epoch": 13.369693396226415, "percentage": 66.85, "elapsed_time": "0:43:13", "remaining_time": "0:21:25", "throughput": 5710.89, "total_tokens": 14808584} {"current_steps": 22680, "total_steps": 33920, "loss": 0.2733, "lr": 2.988621651931777e-06, "epoch": 13.372641509433961, "percentage": 66.86, "elapsed_time": "0:43:13", "remaining_time": "0:21:25", "throughput": 5711.09, "total_tokens": 14813512} {"current_steps": 22685, "total_steps": 33920, "loss": 0.3186, "lr": 2.986266550706315e-06, "epoch": 13.37558962264151, "percentage": 66.88, "elapsed_time": "0:43:14", "remaining_time": "0:21:24", "throughput": 5711.21, "total_tokens": 14817096} {"current_steps": 22690, "total_steps": 33920, "loss": 0.3839, "lr": 2.9839119826254627e-06, "epoch": 13.378537735849056, "percentage": 66.89, "elapsed_time": "0:43:14", "remaining_time": "0:21:24", "throughput": 5711.13, "total_tokens": 14819688} {"current_steps": 22695, "total_steps": 33920, "loss": 0.4517, "lr": 2.981557948312602e-06, "epoch": 13.381485849056604, "percentage": 66.91, "elapsed_time": "0:43:15", "remaining_time": "0:21:23", "throughput": 5711.08, "total_tokens": 14822312} {"current_steps": 22700, "total_steps": 33920, "loss": 0.3721, "lr": 2.9792044483909733e-06, "epoch": 13.38443396226415, "percentage": 66.92, "elapsed_time": "0:43:15", "remaining_time": "0:21:23", "throughput": 5710.96, "total_tokens": 14824744} {"current_steps": 22705, "total_steps": 33920, "loss": 0.4582, "lr": 2.9768514834836767e-06, "epoch": 13.387382075471699, "percentage": 66.94, "elapsed_time": "0:43:16", "remaining_time": "0:21:22", "throughput": 5711.06, "total_tokens": 14828200} {"current_steps": 22710, "total_steps": 33920, "loss": 0.3289, "lr": 2.9744990542136685e-06, "epoch": 13.390330188679245, "percentage": 66.95, "elapsed_time": "0:43:16", "remaining_time": "0:21:21", "throughput": 5711.12, "total_tokens": 14831304} {"current_steps": 22715, "total_steps": 33920, "loss": 0.4045, "lr": 2.9721471612037637e-06, "epoch": 13.393278301886792, "percentage": 66.97, "elapsed_time": "0:43:17", "remaining_time": "0:21:21", "throughput": 5711.39, "total_tokens": 14835752} {"current_steps": 22720, "total_steps": 33920, "loss": 0.3673, "lr": 2.9697958050766385e-06, "epoch": 13.39622641509434, "percentage": 66.98, "elapsed_time": "0:43:18", "remaining_time": "0:21:20", "throughput": 5711.46, "total_tokens": 14838920} {"current_steps": 22725, "total_steps": 33920, "loss": 0.3679, "lr": 2.967444986454825e-06, "epoch": 13.399174528301886, "percentage": 67.0, "elapsed_time": "0:43:18", "remaining_time": "0:21:20", "throughput": 5711.63, "total_tokens": 14842600} {"current_steps": 22730, "total_steps": 33920, "loss": 0.2756, "lr": 2.9650947059607106e-06, "epoch": 13.402122641509434, "percentage": 67.01, "elapsed_time": "0:43:19", "remaining_time": "0:21:19", "throughput": 5711.65, "total_tokens": 14845416} {"current_steps": 22735, "total_steps": 33920, "loss": 0.3059, "lr": 2.962744964216542e-06, "epoch": 13.40507075471698, "percentage": 67.03, "elapsed_time": "0:43:19", "remaining_time": "0:21:18", "throughput": 5711.53, "total_tokens": 14847848} {"current_steps": 22740, "total_steps": 33920, "loss": 0.3736, "lr": 2.960395761844425e-06, "epoch": 13.408018867924529, "percentage": 67.04, "elapsed_time": "0:43:20", "remaining_time": "0:21:18", "throughput": 5711.58, "total_tokens": 14850856} {"current_steps": 22745, "total_steps": 33920, "loss": 0.4219, "lr": 2.95804709946632e-06, "epoch": 13.410966981132075, "percentage": 67.05, "elapsed_time": "0:43:20", "remaining_time": "0:21:17", "throughput": 5711.53, "total_tokens": 14853704} {"current_steps": 22750, "total_steps": 33920, "loss": 0.233, "lr": 2.9556989777040457e-06, "epoch": 13.413915094339623, "percentage": 67.07, "elapsed_time": "0:43:21", "remaining_time": "0:21:17", "throughput": 5711.52, "total_tokens": 14856872} {"current_steps": 22755, "total_steps": 33920, "loss": 0.4429, "lr": 2.9533513971792776e-06, "epoch": 13.41686320754717, "percentage": 67.08, "elapsed_time": "0:43:21", "remaining_time": "0:21:16", "throughput": 5711.31, "total_tokens": 14859304} {"current_steps": 22760, "total_steps": 33920, "loss": 0.2641, "lr": 2.9510043585135473e-06, "epoch": 13.419811320754716, "percentage": 67.1, "elapsed_time": "0:43:22", "remaining_time": "0:21:16", "throughput": 5711.4, "total_tokens": 14862920} {"current_steps": 22765, "total_steps": 33920, "loss": 0.3865, "lr": 2.948657862328244e-06, "epoch": 13.422759433962264, "percentage": 67.11, "elapsed_time": "0:43:22", "remaining_time": "0:21:15", "throughput": 5711.65, "total_tokens": 14867176} {"current_steps": 22770, "total_steps": 33920, "loss": 0.3741, "lr": 2.946311909244613e-06, "epoch": 13.42570754716981, "percentage": 67.13, "elapsed_time": "0:43:23", "remaining_time": "0:21:14", "throughput": 5711.77, "total_tokens": 14870568} {"current_steps": 22775, "total_steps": 33920, "loss": 0.4991, "lr": 2.9439664998837538e-06, "epoch": 13.428655660377359, "percentage": 67.14, "elapsed_time": "0:43:23", "remaining_time": "0:21:14", "throughput": 5711.76, "total_tokens": 14873384} {"current_steps": 22780, "total_steps": 33920, "loss": 0.3299, "lr": 2.941621634866626e-06, "epoch": 13.431603773584905, "percentage": 67.16, "elapsed_time": "0:43:24", "remaining_time": "0:21:13", "throughput": 5711.86, "total_tokens": 14876648} {"current_steps": 22785, "total_steps": 33920, "loss": 0.3602, "lr": 2.9392773148140406e-06, "epoch": 13.434551886792454, "percentage": 67.17, "elapsed_time": "0:43:25", "remaining_time": "0:21:13", "throughput": 5711.96, "total_tokens": 14879976} {"current_steps": 22790, "total_steps": 33920, "loss": 0.293, "lr": 2.9369335403466676e-06, "epoch": 13.4375, "percentage": 67.19, "elapsed_time": "0:43:25", "remaining_time": "0:21:12", "throughput": 5711.9, "total_tokens": 14882632} {"current_steps": 22795, "total_steps": 33920, "loss": 0.5075, "lr": 2.9345903120850318e-06, "epoch": 13.440448113207546, "percentage": 67.2, "elapsed_time": "0:43:26", "remaining_time": "0:21:11", "throughput": 5711.78, "total_tokens": 14885480} {"current_steps": 22800, "total_steps": 33920, "loss": 0.3684, "lr": 2.932247630649512e-06, "epoch": 13.443396226415095, "percentage": 67.22, "elapsed_time": "0:43:26", "remaining_time": "0:21:11", "throughput": 5711.69, "total_tokens": 14888328} {"current_steps": 22805, "total_steps": 33920, "loss": 0.3042, "lr": 2.9299054966603424e-06, "epoch": 13.446344339622641, "percentage": 67.23, "elapsed_time": "0:43:27", "remaining_time": "0:21:10", "throughput": 5711.78, "total_tokens": 14891688} {"current_steps": 22810, "total_steps": 33920, "loss": 0.29, "lr": 2.927563910737613e-06, "epoch": 13.44929245283019, "percentage": 67.25, "elapsed_time": "0:43:27", "remaining_time": "0:21:10", "throughput": 5711.79, "total_tokens": 14894504} {"current_steps": 22815, "total_steps": 33920, "loss": 0.2846, "lr": 2.9252228735012722e-06, "epoch": 13.452240566037736, "percentage": 67.26, "elapsed_time": "0:43:28", "remaining_time": "0:21:09", "throughput": 5711.67, "total_tokens": 14897128} {"current_steps": 22820, "total_steps": 33920, "loss": 0.2392, "lr": 2.9228823855711174e-06, "epoch": 13.455188679245284, "percentage": 67.28, "elapsed_time": "0:43:28", "remaining_time": "0:21:09", "throughput": 5711.96, "total_tokens": 14902088} {"current_steps": 22825, "total_steps": 33920, "loss": 0.3595, "lr": 2.920542447566802e-06, "epoch": 13.45813679245283, "percentage": 67.29, "elapsed_time": "0:43:29", "remaining_time": "0:21:08", "throughput": 5711.97, "total_tokens": 14905064} {"current_steps": 22830, "total_steps": 33920, "loss": 0.4227, "lr": 2.918203060107837e-06, "epoch": 13.461084905660377, "percentage": 67.31, "elapsed_time": "0:43:30", "remaining_time": "0:21:07", "throughput": 5712.05, "total_tokens": 14908456} {"current_steps": 22835, "total_steps": 33920, "loss": 0.3822, "lr": 2.9158642238135813e-06, "epoch": 13.464033018867925, "percentage": 67.32, "elapsed_time": "0:43:30", "remaining_time": "0:21:07", "throughput": 5712.27, "total_tokens": 14912456} {"current_steps": 22840, "total_steps": 33920, "loss": 0.413, "lr": 2.913525939303257e-06, "epoch": 13.466981132075471, "percentage": 67.33, "elapsed_time": "0:43:31", "remaining_time": "0:21:06", "throughput": 5712.28, "total_tokens": 14915656} {"current_steps": 22845, "total_steps": 33920, "loss": 0.3186, "lr": 2.9111882071959317e-06, "epoch": 13.46992924528302, "percentage": 67.35, "elapsed_time": "0:43:31", "remaining_time": "0:21:06", "throughput": 5712.28, "total_tokens": 14918792} {"current_steps": 22850, "total_steps": 33920, "loss": 0.3136, "lr": 2.908851028110532e-06, "epoch": 13.472877358490566, "percentage": 67.36, "elapsed_time": "0:43:32", "remaining_time": "0:21:05", "throughput": 5712.46, "total_tokens": 14923112} {"current_steps": 22855, "total_steps": 33920, "loss": 0.2736, "lr": 2.906514402665834e-06, "epoch": 13.475825471698114, "percentage": 67.38, "elapsed_time": "0:43:32", "remaining_time": "0:21:05", "throughput": 5712.62, "total_tokens": 14926632} {"current_steps": 22860, "total_steps": 33920, "loss": 0.3132, "lr": 2.9041783314804705e-06, "epoch": 13.47877358490566, "percentage": 67.39, "elapsed_time": "0:43:33", "remaining_time": "0:21:04", "throughput": 5712.59, "total_tokens": 14929448} {"current_steps": 22865, "total_steps": 33920, "loss": 0.3507, "lr": 2.9018428151729238e-06, "epoch": 13.481721698113208, "percentage": 67.41, "elapsed_time": "0:43:33", "remaining_time": "0:21:03", "throughput": 5712.37, "total_tokens": 14931752} {"current_steps": 22870, "total_steps": 33920, "loss": 0.2298, "lr": 2.899507854361537e-06, "epoch": 13.484669811320755, "percentage": 67.42, "elapsed_time": "0:43:34", "remaining_time": "0:21:03", "throughput": 5712.23, "total_tokens": 14934376} {"current_steps": 22875, "total_steps": 33920, "loss": 0.3315, "lr": 2.8971734496644975e-06, "epoch": 13.487617924528301, "percentage": 67.44, "elapsed_time": "0:43:34", "remaining_time": "0:21:02", "throughput": 5712.15, "total_tokens": 14937064} {"current_steps": 22880, "total_steps": 33920, "loss": 0.4637, "lr": 2.894839601699851e-06, "epoch": 13.49056603773585, "percentage": 67.45, "elapsed_time": "0:43:35", "remaining_time": "0:21:02", "throughput": 5712.23, "total_tokens": 14940616} {"current_steps": 22885, "total_steps": 33920, "loss": 0.361, "lr": 2.8925063110854923e-06, "epoch": 13.493514150943396, "percentage": 67.47, "elapsed_time": "0:43:36", "remaining_time": "0:21:01", "throughput": 5712.48, "total_tokens": 14944968} {"current_steps": 22890, "total_steps": 33920, "loss": 0.4699, "lr": 2.8901735784391683e-06, "epoch": 13.496462264150944, "percentage": 67.48, "elapsed_time": "0:43:36", "remaining_time": "0:21:00", "throughput": 5712.58, "total_tokens": 14948488} {"current_steps": 22895, "total_steps": 33920, "loss": 0.4044, "lr": 2.8878414043784844e-06, "epoch": 13.49941037735849, "percentage": 67.5, "elapsed_time": "0:43:37", "remaining_time": "0:21:00", "throughput": 5712.5, "total_tokens": 14951176} {"current_steps": 22900, "total_steps": 33920, "loss": 0.2662, "lr": 2.885509789520891e-06, "epoch": 13.502358490566039, "percentage": 67.51, "elapsed_time": "0:43:37", "remaining_time": "0:20:59", "throughput": 5712.27, "total_tokens": 14953448} {"current_steps": 22905, "total_steps": 33920, "loss": 0.3374, "lr": 2.8831787344836926e-06, "epoch": 13.505306603773585, "percentage": 67.53, "elapsed_time": "0:43:38", "remaining_time": "0:20:59", "throughput": 5712.26, "total_tokens": 14956232} {"current_steps": 22910, "total_steps": 33920, "loss": 0.3452, "lr": 2.880848239884049e-06, "epoch": 13.508254716981131, "percentage": 67.54, "elapsed_time": "0:43:38", "remaining_time": "0:20:58", "throughput": 5712.38, "total_tokens": 14960072} {"current_steps": 22915, "total_steps": 33920, "loss": 0.2982, "lr": 2.8785183063389667e-06, "epoch": 13.51120283018868, "percentage": 67.56, "elapsed_time": "0:43:39", "remaining_time": "0:20:58", "throughput": 5712.59, "total_tokens": 14963944} {"current_steps": 22920, "total_steps": 33920, "loss": 0.3902, "lr": 2.876188934465306e-06, "epoch": 13.514150943396226, "percentage": 67.57, "elapsed_time": "0:43:39", "remaining_time": "0:20:57", "throughput": 5712.56, "total_tokens": 14966888} {"current_steps": 22925, "total_steps": 33920, "loss": 0.3042, "lr": 2.8738601248797758e-06, "epoch": 13.517099056603774, "percentage": 67.59, "elapsed_time": "0:43:40", "remaining_time": "0:20:56", "throughput": 5712.62, "total_tokens": 14969992} {"current_steps": 22930, "total_steps": 33920, "loss": 0.4694, "lr": 2.8715318781989432e-06, "epoch": 13.52004716981132, "percentage": 67.6, "elapsed_time": "0:43:41", "remaining_time": "0:20:56", "throughput": 5712.59, "total_tokens": 14972808} {"current_steps": 22935, "total_steps": 33920, "loss": 0.2504, "lr": 2.869204195039219e-06, "epoch": 13.522995283018869, "percentage": 67.61, "elapsed_time": "0:43:41", "remaining_time": "0:20:55", "throughput": 5712.67, "total_tokens": 14976264} {"current_steps": 22940, "total_steps": 33920, "loss": 0.3181, "lr": 2.8668770760168673e-06, "epoch": 13.525943396226415, "percentage": 67.63, "elapsed_time": "0:43:42", "remaining_time": "0:20:55", "throughput": 5712.78, "total_tokens": 14979912} {"current_steps": 22945, "total_steps": 33920, "loss": 0.343, "lr": 2.864550521748003e-06, "epoch": 13.528891509433961, "percentage": 67.64, "elapsed_time": "0:43:42", "remaining_time": "0:20:54", "throughput": 5712.83, "total_tokens": 14983176} {"current_steps": 22950, "total_steps": 33920, "loss": 0.2512, "lr": 2.862224532848591e-06, "epoch": 13.53183962264151, "percentage": 67.66, "elapsed_time": "0:43:43", "remaining_time": "0:20:53", "throughput": 5712.83, "total_tokens": 14986184} {"current_steps": 22955, "total_steps": 33920, "loss": 0.3083, "lr": 2.8598991099344455e-06, "epoch": 13.534787735849056, "percentage": 67.67, "elapsed_time": "0:43:43", "remaining_time": "0:20:53", "throughput": 5712.95, "total_tokens": 14989832} {"current_steps": 22960, "total_steps": 33920, "loss": 0.4403, "lr": 2.857574253621236e-06, "epoch": 13.537735849056604, "percentage": 67.69, "elapsed_time": "0:43:44", "remaining_time": "0:20:52", "throughput": 5712.82, "total_tokens": 14992616} {"current_steps": 22965, "total_steps": 33920, "loss": 0.4873, "lr": 2.855249964524476e-06, "epoch": 13.54068396226415, "percentage": 67.7, "elapsed_time": "0:43:44", "remaining_time": "0:20:52", "throughput": 5712.94, "total_tokens": 14996424} {"current_steps": 22970, "total_steps": 33920, "loss": 0.3503, "lr": 2.852926243259531e-06, "epoch": 13.543632075471699, "percentage": 67.72, "elapsed_time": "0:43:45", "remaining_time": "0:20:51", "throughput": 5712.92, "total_tokens": 14999400} {"current_steps": 22975, "total_steps": 33920, "loss": 0.3814, "lr": 2.850603090441617e-06, "epoch": 13.546580188679245, "percentage": 67.73, "elapsed_time": "0:43:46", "remaining_time": "0:20:51", "throughput": 5712.71, "total_tokens": 15001928} {"current_steps": 22980, "total_steps": 33920, "loss": 0.2914, "lr": 2.848280506685798e-06, "epoch": 13.549528301886792, "percentage": 67.75, "elapsed_time": "0:43:46", "remaining_time": "0:20:50", "throughput": 5712.67, "total_tokens": 15005256} {"current_steps": 22985, "total_steps": 33920, "loss": 0.3507, "lr": 2.845958492606986e-06, "epoch": 13.55247641509434, "percentage": 67.76, "elapsed_time": "0:43:47", "remaining_time": "0:20:49", "throughput": 5712.79, "total_tokens": 15009256} {"current_steps": 22990, "total_steps": 33920, "loss": 0.2759, "lr": 2.843637048819949e-06, "epoch": 13.555424528301886, "percentage": 67.78, "elapsed_time": "0:43:47", "remaining_time": "0:20:49", "throughput": 5712.81, "total_tokens": 15012104} {"current_steps": 22995, "total_steps": 33920, "loss": 0.4352, "lr": 2.8413161759392966e-06, "epoch": 13.558372641509434, "percentage": 67.79, "elapsed_time": "0:43:48", "remaining_time": "0:20:48", "throughput": 5712.79, "total_tokens": 15015176} {"current_steps": 23000, "total_steps": 33920, "loss": 0.3515, "lr": 2.8389958745794878e-06, "epoch": 13.56132075471698, "percentage": 67.81, "elapsed_time": "0:43:48", "remaining_time": "0:20:48", "throughput": 5712.95, "total_tokens": 15018920} {"current_steps": 23005, "total_steps": 33920, "loss": 0.3874, "lr": 2.8366761453548366e-06, "epoch": 13.564268867924529, "percentage": 67.82, "elapsed_time": "0:43:49", "remaining_time": "0:20:47", "throughput": 5713.05, "total_tokens": 15022536} {"current_steps": 23010, "total_steps": 33920, "loss": 0.3192, "lr": 2.8343569888795e-06, "epoch": 13.567216981132075, "percentage": 67.84, "elapsed_time": "0:43:50", "remaining_time": "0:20:46", "throughput": 5713.12, "total_tokens": 15025576} {"current_steps": 23015, "total_steps": 33920, "loss": 0.4975, "lr": 2.832038405767483e-06, "epoch": 13.570165094339622, "percentage": 67.85, "elapsed_time": "0:43:51", "remaining_time": "0:20:46", "throughput": 5713.58, "total_tokens": 15032936} {"current_steps": 23020, "total_steps": 33920, "loss": 0.4222, "lr": 2.8297203966326397e-06, "epoch": 13.57311320754717, "percentage": 67.87, "elapsed_time": "0:43:51", "remaining_time": "0:20:46", "throughput": 5713.4, "total_tokens": 15035336} {"current_steps": 23025, "total_steps": 33920, "loss": 0.3654, "lr": 2.8274029620886773e-06, "epoch": 13.576061320754716, "percentage": 67.88, "elapsed_time": "0:43:52", "remaining_time": "0:20:45", "throughput": 5713.56, "total_tokens": 15038984} {"current_steps": 23030, "total_steps": 33920, "loss": 0.3568, "lr": 2.825086102749144e-06, "epoch": 13.579009433962264, "percentage": 67.9, "elapsed_time": "0:43:52", "remaining_time": "0:20:44", "throughput": 5713.71, "total_tokens": 15042696} {"current_steps": 23035, "total_steps": 33920, "loss": 0.3471, "lr": 2.822769819227438e-06, "epoch": 13.58195754716981, "percentage": 67.91, "elapsed_time": "0:43:53", "remaining_time": "0:20:44", "throughput": 5713.69, "total_tokens": 15045512} {"current_steps": 23040, "total_steps": 33920, "loss": 0.3416, "lr": 2.8204541121368055e-06, "epoch": 13.584905660377359, "percentage": 67.92, "elapsed_time": "0:43:53", "remaining_time": "0:20:43", "throughput": 5713.69, "total_tokens": 15048520} {"current_steps": 23045, "total_steps": 33920, "loss": 0.2729, "lr": 2.8181389820903402e-06, "epoch": 13.587853773584905, "percentage": 67.94, "elapsed_time": "0:43:54", "remaining_time": "0:20:43", "throughput": 5713.74, "total_tokens": 15051720} {"current_steps": 23050, "total_steps": 33920, "loss": 0.3268, "lr": 2.8158244297009814e-06, "epoch": 13.590801886792454, "percentage": 67.95, "elapsed_time": "0:43:54", "remaining_time": "0:20:42", "throughput": 5713.86, "total_tokens": 15055304} {"current_steps": 23055, "total_steps": 33920, "loss": 0.4602, "lr": 2.8135104555815196e-06, "epoch": 13.59375, "percentage": 67.97, "elapsed_time": "0:43:55", "remaining_time": "0:20:41", "throughput": 5713.82, "total_tokens": 15058184} {"current_steps": 23060, "total_steps": 33920, "loss": 0.2435, "lr": 2.811197060344588e-06, "epoch": 13.596698113207546, "percentage": 67.98, "elapsed_time": "0:43:55", "remaining_time": "0:20:41", "throughput": 5713.84, "total_tokens": 15061288} {"current_steps": 23065, "total_steps": 33920, "loss": 0.2613, "lr": 2.8088842446026677e-06, "epoch": 13.599646226415095, "percentage": 68.0, "elapsed_time": "0:43:56", "remaining_time": "0:20:40", "throughput": 5713.88, "total_tokens": 15064488} {"current_steps": 23070, "total_steps": 33920, "loss": 0.2765, "lr": 2.806572008968087e-06, "epoch": 13.602594339622641, "percentage": 68.01, "elapsed_time": "0:43:57", "remaining_time": "0:20:40", "throughput": 5714.11, "total_tokens": 15068680} {"current_steps": 23075, "total_steps": 33920, "loss": 0.2525, "lr": 2.80426035405302e-06, "epoch": 13.60554245283019, "percentage": 68.03, "elapsed_time": "0:43:57", "remaining_time": "0:20:39", "throughput": 5714.17, "total_tokens": 15071784} {"current_steps": 23080, "total_steps": 33920, "loss": 0.2494, "lr": 2.8019492804694852e-06, "epoch": 13.608490566037736, "percentage": 68.04, "elapsed_time": "0:43:58", "remaining_time": "0:20:39", "throughput": 5714.14, "total_tokens": 15074824} {"current_steps": 23085, "total_steps": 33920, "loss": 0.304, "lr": 2.799638788829354e-06, "epoch": 13.611438679245284, "percentage": 68.06, "elapsed_time": "0:43:58", "remaining_time": "0:20:38", "throughput": 5714.13, "total_tokens": 15077768} {"current_steps": 23090, "total_steps": 33920, "loss": 0.2506, "lr": 2.7973288797443367e-06, "epoch": 13.61438679245283, "percentage": 68.07, "elapsed_time": "0:43:59", "remaining_time": "0:20:37", "throughput": 5714.2, "total_tokens": 15080712} {"current_steps": 23095, "total_steps": 33920, "loss": 0.2947, "lr": 2.7950195538259884e-06, "epoch": 13.617334905660378, "percentage": 68.09, "elapsed_time": "0:43:59", "remaining_time": "0:20:37", "throughput": 5714.23, "total_tokens": 15083560} {"current_steps": 23100, "total_steps": 33920, "loss": 0.2852, "lr": 2.792710811685719e-06, "epoch": 13.620283018867925, "percentage": 68.1, "elapsed_time": "0:44:00", "remaining_time": "0:20:36", "throughput": 5714.39, "total_tokens": 15087240} {"current_steps": 23105, "total_steps": 33920, "loss": 0.2911, "lr": 2.7904026539347743e-06, "epoch": 13.623231132075471, "percentage": 68.12, "elapsed_time": "0:44:00", "remaining_time": "0:20:36", "throughput": 5714.48, "total_tokens": 15090440} {"current_steps": 23110, "total_steps": 33920, "loss": 0.4361, "lr": 2.7880950811842507e-06, "epoch": 13.62617924528302, "percentage": 68.13, "elapsed_time": "0:44:01", "remaining_time": "0:20:35", "throughput": 5714.52, "total_tokens": 15093992} {"current_steps": 23115, "total_steps": 33920, "loss": 0.4104, "lr": 2.785788094045085e-06, "epoch": 13.629127358490566, "percentage": 68.15, "elapsed_time": "0:44:01", "remaining_time": "0:20:34", "throughput": 5714.54, "total_tokens": 15096904} {"current_steps": 23120, "total_steps": 33920, "loss": 0.2685, "lr": 2.7834816931280655e-06, "epoch": 13.632075471698114, "percentage": 68.16, "elapsed_time": "0:44:02", "remaining_time": "0:20:34", "throughput": 5714.59, "total_tokens": 15100168} {"current_steps": 23125, "total_steps": 33920, "loss": 0.4806, "lr": 2.781175879043821e-06, "epoch": 13.63502358490566, "percentage": 68.18, "elapsed_time": "0:44:02", "remaining_time": "0:20:33", "throughput": 5714.42, "total_tokens": 15102728} {"current_steps": 23130, "total_steps": 33920, "loss": 0.3423, "lr": 2.778870652402825e-06, "epoch": 13.637971698113208, "percentage": 68.19, "elapsed_time": "0:44:03", "remaining_time": "0:20:33", "throughput": 5714.35, "total_tokens": 15105544} {"current_steps": 23135, "total_steps": 33920, "loss": 0.3124, "lr": 2.776566013815396e-06, "epoch": 13.640919811320755, "percentage": 68.2, "elapsed_time": "0:44:03", "remaining_time": "0:20:32", "throughput": 5714.52, "total_tokens": 15109096} {"current_steps": 23140, "total_steps": 33920, "loss": 0.3938, "lr": 2.774261963891698e-06, "epoch": 13.643867924528301, "percentage": 68.22, "elapsed_time": "0:44:04", "remaining_time": "0:20:31", "throughput": 5714.73, "total_tokens": 15112840} {"current_steps": 23145, "total_steps": 33920, "loss": 0.3108, "lr": 2.771958503241735e-06, "epoch": 13.64681603773585, "percentage": 68.23, "elapsed_time": "0:44:05", "remaining_time": "0:20:31", "throughput": 5714.86, "total_tokens": 15116200} {"current_steps": 23150, "total_steps": 33920, "loss": 0.4542, "lr": 2.769655632475362e-06, "epoch": 13.649764150943396, "percentage": 68.25, "elapsed_time": "0:44:05", "remaining_time": "0:20:30", "throughput": 5714.74, "total_tokens": 15118728} {"current_steps": 23155, "total_steps": 33920, "loss": 0.3012, "lr": 2.7673533522022733e-06, "epoch": 13.652712264150944, "percentage": 68.26, "elapsed_time": "0:44:06", "remaining_time": "0:20:30", "throughput": 5714.72, "total_tokens": 15121896} {"current_steps": 23160, "total_steps": 33920, "loss": 0.3006, "lr": 2.765051663032007e-06, "epoch": 13.65566037735849, "percentage": 68.28, "elapsed_time": "0:44:06", "remaining_time": "0:20:29", "throughput": 5714.56, "total_tokens": 15124232} {"current_steps": 23165, "total_steps": 33920, "loss": 0.249, "lr": 2.7627505655739446e-06, "epoch": 13.658608490566039, "percentage": 68.29, "elapsed_time": "0:44:07", "remaining_time": "0:20:28", "throughput": 5714.53, "total_tokens": 15126984} {"current_steps": 23170, "total_steps": 33920, "loss": 0.391, "lr": 2.7604500604373097e-06, "epoch": 13.661556603773585, "percentage": 68.31, "elapsed_time": "0:44:07", "remaining_time": "0:20:28", "throughput": 5714.67, "total_tokens": 15130664} {"current_steps": 23175, "total_steps": 33920, "loss": 0.3589, "lr": 2.7581501482311757e-06, "epoch": 13.664504716981131, "percentage": 68.32, "elapsed_time": "0:44:08", "remaining_time": "0:20:27", "throughput": 5714.62, "total_tokens": 15133320} {"current_steps": 23180, "total_steps": 33920, "loss": 0.2966, "lr": 2.7558508295644513e-06, "epoch": 13.66745283018868, "percentage": 68.34, "elapsed_time": "0:44:08", "remaining_time": "0:20:27", "throughput": 5714.71, "total_tokens": 15136552} {"current_steps": 23185, "total_steps": 33920, "loss": 0.2632, "lr": 2.7535521050458922e-06, "epoch": 13.670400943396226, "percentage": 68.35, "elapsed_time": "0:44:09", "remaining_time": "0:20:26", "throughput": 5714.89, "total_tokens": 15143208} {"current_steps": 23190, "total_steps": 33920, "loss": 0.2723, "lr": 2.7512539752840926e-06, "epoch": 13.673349056603774, "percentage": 68.37, "elapsed_time": "0:44:10", "remaining_time": "0:20:26", "throughput": 5714.98, "total_tokens": 15147240} {"current_steps": 23195, "total_steps": 33920, "loss": 0.4407, "lr": 2.748956440887497e-06, "epoch": 13.67629716981132, "percentage": 68.38, "elapsed_time": "0:44:10", "remaining_time": "0:20:25", "throughput": 5714.83, "total_tokens": 15149736} {"current_steps": 23200, "total_steps": 33920, "loss": 0.3704, "lr": 2.7466595024643843e-06, "epoch": 13.679245283018869, "percentage": 68.4, "elapsed_time": "0:44:11", "remaining_time": "0:20:25", "throughput": 5714.89, "total_tokens": 15152872} {"current_steps": 23205, "total_steps": 33920, "loss": 0.4685, "lr": 2.744363160622878e-06, "epoch": 13.682193396226415, "percentage": 68.41, "elapsed_time": "0:44:11", "remaining_time": "0:20:24", "throughput": 5714.89, "total_tokens": 15155752} {"current_steps": 23210, "total_steps": 33920, "loss": 0.3259, "lr": 2.742067415970948e-06, "epoch": 13.685141509433961, "percentage": 68.43, "elapsed_time": "0:44:12", "remaining_time": "0:20:23", "throughput": 5714.89, "total_tokens": 15158600} {"current_steps": 23215, "total_steps": 33920, "loss": 0.3177, "lr": 2.739772269116402e-06, "epoch": 13.68808962264151, "percentage": 68.44, "elapsed_time": "0:44:13", "remaining_time": "0:20:23", "throughput": 5714.82, "total_tokens": 15161608} {"current_steps": 23220, "total_steps": 33920, "loss": 0.3805, "lr": 2.7374777206668874e-06, "epoch": 13.691037735849056, "percentage": 68.46, "elapsed_time": "0:44:13", "remaining_time": "0:20:22", "throughput": 5714.72, "total_tokens": 15164232} {"current_steps": 23225, "total_steps": 33920, "loss": 0.4193, "lr": 2.735183771229898e-06, "epoch": 13.693985849056604, "percentage": 68.47, "elapsed_time": "0:44:14", "remaining_time": "0:20:22", "throughput": 5714.73, "total_tokens": 15167240} {"current_steps": 23230, "total_steps": 33920, "loss": 0.2843, "lr": 2.732890421412765e-06, "epoch": 13.69693396226415, "percentage": 68.48, "elapsed_time": "0:44:14", "remaining_time": "0:20:21", "throughput": 5714.7, "total_tokens": 15170568} {"current_steps": 23235, "total_steps": 33920, "loss": 0.5135, "lr": 2.7305976718226624e-06, "epoch": 13.699882075471699, "percentage": 68.5, "elapsed_time": "0:44:15", "remaining_time": "0:20:21", "throughput": 5714.98, "total_tokens": 15175144} {"current_steps": 23240, "total_steps": 33920, "loss": 0.3248, "lr": 2.728305523066609e-06, "epoch": 13.702830188679245, "percentage": 68.51, "elapsed_time": "0:44:15", "remaining_time": "0:20:20", "throughput": 5715.07, "total_tokens": 15178664} {"current_steps": 23245, "total_steps": 33920, "loss": 0.2745, "lr": 2.726013975751458e-06, "epoch": 13.705778301886792, "percentage": 68.53, "elapsed_time": "0:44:16", "remaining_time": "0:20:19", "throughput": 5714.9, "total_tokens": 15181160} {"current_steps": 23250, "total_steps": 33920, "loss": 0.3392, "lr": 2.723723030483908e-06, "epoch": 13.70872641509434, "percentage": 68.54, "elapsed_time": "0:44:16", "remaining_time": "0:20:19", "throughput": 5714.89, "total_tokens": 15184392} {"current_steps": 23255, "total_steps": 33920, "loss": 0.3636, "lr": 2.7214326878704953e-06, "epoch": 13.711674528301886, "percentage": 68.56, "elapsed_time": "0:44:17", "remaining_time": "0:20:18", "throughput": 5715.02, "total_tokens": 15188520} {"current_steps": 23260, "total_steps": 33920, "loss": 0.3898, "lr": 2.7191429485175993e-06, "epoch": 13.714622641509434, "percentage": 68.57, "elapsed_time": "0:44:18", "remaining_time": "0:20:18", "throughput": 5714.9, "total_tokens": 15191016} {"current_steps": 23265, "total_steps": 33920, "loss": 0.2562, "lr": 2.716853813031435e-06, "epoch": 13.71757075471698, "percentage": 68.59, "elapsed_time": "0:44:18", "remaining_time": "0:20:17", "throughput": 5714.96, "total_tokens": 15194248} {"current_steps": 23270, "total_steps": 33920, "loss": 0.4399, "lr": 2.714565282018066e-06, "epoch": 13.720518867924529, "percentage": 68.6, "elapsed_time": "0:44:19", "remaining_time": "0:20:17", "throughput": 5715.03, "total_tokens": 15197288} {"current_steps": 23275, "total_steps": 33920, "loss": 0.2981, "lr": 2.7122773560833877e-06, "epoch": 13.723466981132075, "percentage": 68.62, "elapsed_time": "0:44:19", "remaining_time": "0:20:16", "throughput": 5715.18, "total_tokens": 15200904} {"current_steps": 23280, "total_steps": 33920, "loss": 0.2533, "lr": 2.709990035833139e-06, "epoch": 13.726415094339622, "percentage": 68.63, "elapsed_time": "0:44:20", "remaining_time": "0:20:15", "throughput": 5715.2, "total_tokens": 15204072} {"current_steps": 23285, "total_steps": 33920, "loss": 0.4192, "lr": 2.707703321872896e-06, "epoch": 13.72936320754717, "percentage": 68.65, "elapsed_time": "0:44:20", "remaining_time": "0:20:15", "throughput": 5715.23, "total_tokens": 15207144} {"current_steps": 23290, "total_steps": 33920, "loss": 0.3169, "lr": 2.705417214808079e-06, "epoch": 13.732311320754716, "percentage": 68.66, "elapsed_time": "0:44:21", "remaining_time": "0:20:14", "throughput": 5715.1, "total_tokens": 15209832} {"current_steps": 23295, "total_steps": 33920, "loss": 0.3322, "lr": 2.703131715243945e-06, "epoch": 13.735259433962264, "percentage": 68.68, "elapsed_time": "0:44:21", "remaining_time": "0:20:14", "throughput": 5715.07, "total_tokens": 15212648} {"current_steps": 23300, "total_steps": 33920, "loss": 0.278, "lr": 2.7008468237855855e-06, "epoch": 13.73820754716981, "percentage": 68.69, "elapsed_time": "0:44:22", "remaining_time": "0:20:13", "throughput": 5715.1, "total_tokens": 15216168} {"current_steps": 23305, "total_steps": 33920, "loss": 0.3287, "lr": 2.69856254103794e-06, "epoch": 13.741155660377359, "percentage": 68.71, "elapsed_time": "0:44:22", "remaining_time": "0:20:12", "throughput": 5715.07, "total_tokens": 15218888} {"current_steps": 23310, "total_steps": 33920, "loss": 0.3739, "lr": 2.6962788676057806e-06, "epoch": 13.744103773584905, "percentage": 68.72, "elapsed_time": "0:44:23", "remaining_time": "0:20:12", "throughput": 5714.98, "total_tokens": 15221672} {"current_steps": 23315, "total_steps": 33920, "loss": 0.3131, "lr": 2.69399580409372e-06, "epoch": 13.747051886792454, "percentage": 68.74, "elapsed_time": "0:44:24", "remaining_time": "0:20:11", "throughput": 5715.16, "total_tokens": 15225352} {"current_steps": 23320, "total_steps": 33920, "loss": 0.3032, "lr": 2.6917133511062076e-06, "epoch": 13.75, "percentage": 68.75, "elapsed_time": "0:44:24", "remaining_time": "0:20:11", "throughput": 5715.23, "total_tokens": 15228264} {"current_steps": 23325, "total_steps": 33920, "loss": 0.4379, "lr": 2.6894315092475342e-06, "epoch": 13.752948113207546, "percentage": 68.76, "elapsed_time": "0:44:25", "remaining_time": "0:20:10", "throughput": 5715.37, "total_tokens": 15231560} {"current_steps": 23330, "total_steps": 33920, "loss": 0.2724, "lr": 2.6871502791218245e-06, "epoch": 13.755896226415095, "percentage": 68.78, "elapsed_time": "0:44:25", "remaining_time": "0:20:10", "throughput": 5715.52, "total_tokens": 15237192} {"current_steps": 23335, "total_steps": 33920, "loss": 0.4597, "lr": 2.684869661333048e-06, "epoch": 13.758844339622641, "percentage": 68.79, "elapsed_time": "0:44:26", "remaining_time": "0:20:09", "throughput": 5715.57, "total_tokens": 15240200} {"current_steps": 23340, "total_steps": 33920, "loss": 0.3341, "lr": 2.6825896564850074e-06, "epoch": 13.76179245283019, "percentage": 68.81, "elapsed_time": "0:44:27", "remaining_time": "0:20:08", "throughput": 5715.59, "total_tokens": 15243528} {"current_steps": 23345, "total_steps": 33920, "loss": 0.3714, "lr": 2.6803102651813416e-06, "epoch": 13.764740566037736, "percentage": 68.82, "elapsed_time": "0:44:27", "remaining_time": "0:20:08", "throughput": 5715.49, "total_tokens": 15246120} {"current_steps": 23350, "total_steps": 33920, "loss": 0.2401, "lr": 2.6780314880255307e-06, "epoch": 13.767688679245284, "percentage": 68.84, "elapsed_time": "0:44:28", "remaining_time": "0:20:07", "throughput": 5715.62, "total_tokens": 15249896} {"current_steps": 23355, "total_steps": 33920, "loss": 0.3649, "lr": 2.675753325620891e-06, "epoch": 13.77063679245283, "percentage": 68.85, "elapsed_time": "0:44:28", "remaining_time": "0:20:07", "throughput": 5715.8, "total_tokens": 15253576} {"current_steps": 23360, "total_steps": 33920, "loss": 0.3845, "lr": 2.6734757785705727e-06, "epoch": 13.773584905660378, "percentage": 68.87, "elapsed_time": "0:44:29", "remaining_time": "0:20:06", "throughput": 5715.9, "total_tokens": 15257320} {"current_steps": 23365, "total_steps": 33920, "loss": 0.4991, "lr": 2.6711988474775712e-06, "epoch": 13.776533018867925, "percentage": 68.88, "elapsed_time": "0:44:29", "remaining_time": "0:20:06", "throughput": 5715.98, "total_tokens": 15260872} {"current_steps": 23370, "total_steps": 33920, "loss": 0.2537, "lr": 2.668922532944711e-06, "epoch": 13.779481132075471, "percentage": 68.9, "elapsed_time": "0:44:30", "remaining_time": "0:20:05", "throughput": 5715.96, "total_tokens": 15263976} {"current_steps": 23375, "total_steps": 33920, "loss": 0.4049, "lr": 2.6666468355746566e-06, "epoch": 13.78242924528302, "percentage": 68.91, "elapsed_time": "0:44:30", "remaining_time": "0:20:04", "throughput": 5716.1, "total_tokens": 15267336} {"current_steps": 23380, "total_steps": 33920, "loss": 0.3734, "lr": 2.6643717559699073e-06, "epoch": 13.785377358490566, "percentage": 68.93, "elapsed_time": "0:44:31", "remaining_time": "0:20:04", "throughput": 5716.09, "total_tokens": 15270312} {"current_steps": 23385, "total_steps": 33920, "loss": 0.3298, "lr": 2.662097294732803e-06, "epoch": 13.788325471698114, "percentage": 68.94, "elapsed_time": "0:44:31", "remaining_time": "0:20:03", "throughput": 5716.02, "total_tokens": 15273192} {"current_steps": 23390, "total_steps": 33920, "loss": 0.3202, "lr": 2.6598234524655165e-06, "epoch": 13.79127358490566, "percentage": 68.96, "elapsed_time": "0:44:32", "remaining_time": "0:20:03", "throughput": 5715.85, "total_tokens": 15275624} {"current_steps": 23395, "total_steps": 33920, "loss": 0.3269, "lr": 2.657550229770054e-06, "epoch": 13.794221698113208, "percentage": 68.97, "elapsed_time": "0:44:33", "remaining_time": "0:20:02", "throughput": 5715.89, "total_tokens": 15278760} {"current_steps": 23400, "total_steps": 33920, "loss": 0.2838, "lr": 2.655277627248265e-06, "epoch": 13.797169811320755, "percentage": 68.99, "elapsed_time": "0:44:33", "remaining_time": "0:20:02", "throughput": 5716.17, "total_tokens": 15283080} {"current_steps": 23405, "total_steps": 33920, "loss": 0.3196, "lr": 2.65300564550183e-06, "epoch": 13.800117924528301, "percentage": 69.0, "elapsed_time": "0:44:34", "remaining_time": "0:20:01", "throughput": 5716.07, "total_tokens": 15285768} {"current_steps": 23410, "total_steps": 33920, "loss": 0.3361, "lr": 2.6507342851322647e-06, "epoch": 13.80306603773585, "percentage": 69.02, "elapsed_time": "0:44:34", "remaining_time": "0:20:00", "throughput": 5716.04, "total_tokens": 15288616} {"current_steps": 23415, "total_steps": 33920, "loss": 0.3475, "lr": 2.6484635467409233e-06, "epoch": 13.806014150943396, "percentage": 69.03, "elapsed_time": "0:44:35", "remaining_time": "0:20:00", "throughput": 5716.16, "total_tokens": 15292264} {"current_steps": 23420, "total_steps": 33920, "loss": 0.3056, "lr": 2.64619343092899e-06, "epoch": 13.808962264150944, "percentage": 69.04, "elapsed_time": "0:44:35", "remaining_time": "0:19:59", "throughput": 5716.02, "total_tokens": 15294664} {"current_steps": 23425, "total_steps": 33920, "loss": 0.3491, "lr": 2.643923938297492e-06, "epoch": 13.81191037735849, "percentage": 69.06, "elapsed_time": "0:44:36", "remaining_time": "0:19:59", "throughput": 5715.98, "total_tokens": 15297288} {"current_steps": 23430, "total_steps": 33920, "loss": 0.2772, "lr": 2.6416550694472855e-06, "epoch": 13.814858490566039, "percentage": 69.07, "elapsed_time": "0:44:36", "remaining_time": "0:19:58", "throughput": 5715.98, "total_tokens": 15300328} {"current_steps": 23435, "total_steps": 33920, "loss": 0.3236, "lr": 2.639386824979063e-06, "epoch": 13.817806603773585, "percentage": 69.09, "elapsed_time": "0:44:37", "remaining_time": "0:19:57", "throughput": 5716.04, "total_tokens": 15303720} {"current_steps": 23440, "total_steps": 33920, "loss": 0.3114, "lr": 2.6371192054933525e-06, "epoch": 13.820754716981131, "percentage": 69.1, "elapsed_time": "0:44:37", "remaining_time": "0:19:57", "throughput": 5716.1, "total_tokens": 15306824} {"current_steps": 23445, "total_steps": 33920, "loss": 0.3862, "lr": 2.634852211590516e-06, "epoch": 13.82370283018868, "percentage": 69.12, "elapsed_time": "0:44:38", "remaining_time": "0:19:56", "throughput": 5716.26, "total_tokens": 15310472} {"current_steps": 23450, "total_steps": 33920, "loss": 0.3303, "lr": 2.6325858438707473e-06, "epoch": 13.826650943396226, "percentage": 69.13, "elapsed_time": "0:44:38", "remaining_time": "0:19:56", "throughput": 5716.37, "total_tokens": 15313896} {"current_steps": 23455, "total_steps": 33920, "loss": 0.3356, "lr": 2.630320102934082e-06, "epoch": 13.829599056603774, "percentage": 69.15, "elapsed_time": "0:44:39", "remaining_time": "0:19:55", "throughput": 5716.38, "total_tokens": 15316712} {"current_steps": 23460, "total_steps": 33920, "loss": 0.2678, "lr": 2.628054989380382e-06, "epoch": 13.83254716981132, "percentage": 69.16, "elapsed_time": "0:44:40", "remaining_time": "0:19:54", "throughput": 5716.53, "total_tokens": 15320360} {"current_steps": 23465, "total_steps": 33920, "loss": 0.4571, "lr": 2.625790503809346e-06, "epoch": 13.835495283018869, "percentage": 69.18, "elapsed_time": "0:44:40", "remaining_time": "0:19:54", "throughput": 5716.46, "total_tokens": 15322952} {"current_steps": 23470, "total_steps": 33920, "loss": 0.3216, "lr": 2.6235266468205067e-06, "epoch": 13.838443396226415, "percentage": 69.19, "elapsed_time": "0:44:41", "remaining_time": "0:19:53", "throughput": 5716.65, "total_tokens": 15327080} {"current_steps": 23475, "total_steps": 33920, "loss": 0.4281, "lr": 2.621263419013227e-06, "epoch": 13.841391509433961, "percentage": 69.21, "elapsed_time": "0:44:41", "remaining_time": "0:19:53", "throughput": 5716.59, "total_tokens": 15329640} {"current_steps": 23480, "total_steps": 33920, "loss": 0.2933, "lr": 2.619000820986711e-06, "epoch": 13.84433962264151, "percentage": 69.22, "elapsed_time": "0:44:42", "remaining_time": "0:19:52", "throughput": 5716.54, "total_tokens": 15332232} {"current_steps": 23485, "total_steps": 33920, "loss": 0.3308, "lr": 2.616738853339988e-06, "epoch": 13.847287735849056, "percentage": 69.24, "elapsed_time": "0:44:42", "remaining_time": "0:19:51", "throughput": 5716.56, "total_tokens": 15335560} {"current_steps": 23490, "total_steps": 33920, "loss": 0.3435, "lr": 2.614477516671926e-06, "epoch": 13.850235849056604, "percentage": 69.25, "elapsed_time": "0:44:43", "remaining_time": "0:19:51", "throughput": 5716.58, "total_tokens": 15338536} {"current_steps": 23495, "total_steps": 33920, "loss": 0.3345, "lr": 2.612216811581223e-06, "epoch": 13.85318396226415, "percentage": 69.27, "elapsed_time": "0:44:43", "remaining_time": "0:19:50", "throughput": 5716.73, "total_tokens": 15342216} {"current_steps": 23500, "total_steps": 33920, "loss": 0.4646, "lr": 2.6099567386664095e-06, "epoch": 13.856132075471699, "percentage": 69.28, "elapsed_time": "0:44:44", "remaining_time": "0:19:50", "throughput": 5716.81, "total_tokens": 15345544} {"current_steps": 23505, "total_steps": 33920, "loss": 0.3374, "lr": 2.60769729852585e-06, "epoch": 13.859080188679245, "percentage": 69.3, "elapsed_time": "0:44:44", "remaining_time": "0:19:49", "throughput": 5716.79, "total_tokens": 15348296} {"current_steps": 23510, "total_steps": 33920, "loss": 0.2977, "lr": 2.6054384917577413e-06, "epoch": 13.862028301886792, "percentage": 69.31, "elapsed_time": "0:44:45", "remaining_time": "0:19:49", "throughput": 5716.88, "total_tokens": 15351560} {"current_steps": 23515, "total_steps": 33920, "loss": 0.3796, "lr": 2.60318031896011e-06, "epoch": 13.86497641509434, "percentage": 69.32, "elapsed_time": "0:44:45", "remaining_time": "0:19:48", "throughput": 5716.9, "total_tokens": 15354600} {"current_steps": 23520, "total_steps": 33920, "loss": 0.3804, "lr": 2.60092278073082e-06, "epoch": 13.867924528301886, "percentage": 69.34, "elapsed_time": "0:44:46", "remaining_time": "0:19:47", "throughput": 5716.83, "total_tokens": 15357352} {"current_steps": 23525, "total_steps": 33920, "loss": 0.5134, "lr": 2.5986658776675644e-06, "epoch": 13.870872641509434, "percentage": 69.35, "elapsed_time": "0:44:46", "remaining_time": "0:19:47", "throughput": 5716.97, "total_tokens": 15360872} {"current_steps": 23530, "total_steps": 33920, "loss": 0.254, "lr": 2.5964096103678666e-06, "epoch": 13.87382075471698, "percentage": 69.37, "elapsed_time": "0:44:47", "remaining_time": "0:19:46", "throughput": 5716.89, "total_tokens": 15363496} {"current_steps": 23535, "total_steps": 33920, "loss": 0.3577, "lr": 2.5941539794290833e-06, "epoch": 13.876768867924529, "percentage": 69.38, "elapsed_time": "0:44:47", "remaining_time": "0:19:46", "throughput": 5716.85, "total_tokens": 15366568} {"current_steps": 23540, "total_steps": 33920, "loss": 0.3424, "lr": 2.5918989854484024e-06, "epoch": 13.879716981132075, "percentage": 69.4, "elapsed_time": "0:44:48", "remaining_time": "0:19:45", "throughput": 5716.96, "total_tokens": 15370248} {"current_steps": 23545, "total_steps": 33920, "loss": 0.2838, "lr": 2.5896446290228417e-06, "epoch": 13.882665094339622, "percentage": 69.41, "elapsed_time": "0:44:49", "remaining_time": "0:19:44", "throughput": 5717.04, "total_tokens": 15373352} {"current_steps": 23550, "total_steps": 33920, "loss": 0.2772, "lr": 2.5873909107492547e-06, "epoch": 13.88561320754717, "percentage": 69.43, "elapsed_time": "0:44:49", "remaining_time": "0:19:44", "throughput": 5717.13, "total_tokens": 15376552} {"current_steps": 23555, "total_steps": 33920, "loss": 0.4325, "lr": 2.5851378312243224e-06, "epoch": 13.888561320754716, "percentage": 69.44, "elapsed_time": "0:44:50", "remaining_time": "0:19:43", "throughput": 5717.18, "total_tokens": 15380232} {"current_steps": 23560, "total_steps": 33920, "loss": 0.3464, "lr": 2.5828853910445572e-06, "epoch": 13.891509433962264, "percentage": 69.46, "elapsed_time": "0:44:50", "remaining_time": "0:19:43", "throughput": 5717.29, "total_tokens": 15383592} {"current_steps": 23565, "total_steps": 33920, "loss": 0.3864, "lr": 2.5806335908063012e-06, "epoch": 13.89445754716981, "percentage": 69.47, "elapsed_time": "0:44:51", "remaining_time": "0:19:42", "throughput": 5717.09, "total_tokens": 15385768} {"current_steps": 23570, "total_steps": 33920, "loss": 0.4094, "lr": 2.5783824311057293e-06, "epoch": 13.897405660377359, "percentage": 69.49, "elapsed_time": "0:44:51", "remaining_time": "0:19:41", "throughput": 5717.13, "total_tokens": 15389032} {"current_steps": 23575, "total_steps": 33920, "loss": 0.3565, "lr": 2.5761319125388433e-06, "epoch": 13.900353773584905, "percentage": 69.5, "elapsed_time": "0:44:52", "remaining_time": "0:19:41", "throughput": 5717.37, "total_tokens": 15393000} {"current_steps": 23580, "total_steps": 33920, "loss": 0.3611, "lr": 2.57388203570148e-06, "epoch": 13.903301886792454, "percentage": 69.52, "elapsed_time": "0:44:52", "remaining_time": "0:19:40", "throughput": 5717.5, "total_tokens": 15396648} {"current_steps": 23585, "total_steps": 33920, "loss": 0.4393, "lr": 2.5716328011893055e-06, "epoch": 13.90625, "percentage": 69.53, "elapsed_time": "0:44:53", "remaining_time": "0:19:40", "throughput": 5717.46, "total_tokens": 15399496} {"current_steps": 23590, "total_steps": 33920, "loss": 0.3381, "lr": 2.5693842095978127e-06, "epoch": 13.909198113207546, "percentage": 69.55, "elapsed_time": "0:44:53", "remaining_time": "0:19:39", "throughput": 5717.5, "total_tokens": 15402504} {"current_steps": 23595, "total_steps": 33920, "loss": 0.2975, "lr": 2.567136261522325e-06, "epoch": 13.912146226415095, "percentage": 69.56, "elapsed_time": "0:44:54", "remaining_time": "0:19:39", "throughput": 5717.62, "total_tokens": 15405896} {"current_steps": 23600, "total_steps": 33920, "loss": 0.3256, "lr": 2.5648889575579985e-06, "epoch": 13.915094339622641, "percentage": 69.58, "elapsed_time": "0:44:55", "remaining_time": "0:19:38", "throughput": 5717.7, "total_tokens": 15409640} {"current_steps": 23605, "total_steps": 33920, "loss": 0.3153, "lr": 2.562642298299814e-06, "epoch": 13.91804245283019, "percentage": 69.59, "elapsed_time": "0:44:55", "remaining_time": "0:19:37", "throughput": 5717.75, "total_tokens": 15412520} {"current_steps": 23610, "total_steps": 33920, "loss": 0.4431, "lr": 2.560396284342584e-06, "epoch": 13.920990566037736, "percentage": 69.6, "elapsed_time": "0:44:56", "remaining_time": "0:19:37", "throughput": 5717.83, "total_tokens": 15415560} {"current_steps": 23615, "total_steps": 33920, "loss": 0.3398, "lr": 2.558150916280954e-06, "epoch": 13.923938679245284, "percentage": 69.62, "elapsed_time": "0:44:56", "remaining_time": "0:19:36", "throughput": 5717.69, "total_tokens": 15418216} {"current_steps": 23620, "total_steps": 33920, "loss": 0.3278, "lr": 2.555906194709392e-06, "epoch": 13.92688679245283, "percentage": 69.63, "elapsed_time": "0:44:57", "remaining_time": "0:19:36", "throughput": 5717.8, "total_tokens": 15421512} {"current_steps": 23625, "total_steps": 33920, "loss": 0.2963, "lr": 2.553662120222199e-06, "epoch": 13.929834905660378, "percentage": 69.65, "elapsed_time": "0:44:57", "remaining_time": "0:19:35", "throughput": 5717.83, "total_tokens": 15424712} {"current_steps": 23630, "total_steps": 33920, "loss": 0.3759, "lr": 2.5514186934135026e-06, "epoch": 13.932783018867925, "percentage": 69.66, "elapsed_time": "0:44:58", "remaining_time": "0:19:34", "throughput": 5717.93, "total_tokens": 15428360} {"current_steps": 23635, "total_steps": 33920, "loss": 0.2503, "lr": 2.54917591487726e-06, "epoch": 13.935731132075471, "percentage": 69.68, "elapsed_time": "0:44:58", "remaining_time": "0:19:34", "throughput": 5718.09, "total_tokens": 15432392} {"current_steps": 23640, "total_steps": 33920, "loss": 0.3489, "lr": 2.5469337852072547e-06, "epoch": 13.93867924528302, "percentage": 69.69, "elapsed_time": "0:44:59", "remaining_time": "0:19:33", "throughput": 5718.19, "total_tokens": 15436136} {"current_steps": 23645, "total_steps": 33920, "loss": 0.4321, "lr": 2.5446923049971035e-06, "epoch": 13.941627358490566, "percentage": 69.71, "elapsed_time": "0:44:59", "remaining_time": "0:19:33", "throughput": 5718.16, "total_tokens": 15438792} {"current_steps": 23650, "total_steps": 33920, "loss": 0.2789, "lr": 2.5424514748402463e-06, "epoch": 13.944575471698114, "percentage": 69.72, "elapsed_time": "0:45:00", "remaining_time": "0:19:32", "throughput": 5718.07, "total_tokens": 15441352} {"current_steps": 23655, "total_steps": 33920, "loss": 0.3534, "lr": 2.540211295329953e-06, "epoch": 13.94752358490566, "percentage": 69.74, "elapsed_time": "0:45:00", "remaining_time": "0:19:32", "throughput": 5717.98, "total_tokens": 15443720} {"current_steps": 23660, "total_steps": 33920, "loss": 0.3427, "lr": 2.5379717670593197e-06, "epoch": 13.950471698113208, "percentage": 69.75, "elapsed_time": "0:45:01", "remaining_time": "0:19:31", "throughput": 5718.12, "total_tokens": 15447016} {"current_steps": 23665, "total_steps": 33920, "loss": 0.3692, "lr": 2.53573289062127e-06, "epoch": 13.953419811320755, "percentage": 69.77, "elapsed_time": "0:45:01", "remaining_time": "0:19:30", "throughput": 5718.1, "total_tokens": 15450024} {"current_steps": 23670, "total_steps": 33920, "loss": 0.3301, "lr": 2.5334946666085605e-06, "epoch": 13.956367924528301, "percentage": 69.78, "elapsed_time": "0:45:02", "remaining_time": "0:19:30", "throughput": 5718.21, "total_tokens": 15453576} {"current_steps": 23675, "total_steps": 33920, "loss": 0.2432, "lr": 2.531257095613766e-06, "epoch": 13.95931603773585, "percentage": 69.8, "elapsed_time": "0:45:03", "remaining_time": "0:19:29", "throughput": 5718.4, "total_tokens": 15457480} {"current_steps": 23680, "total_steps": 33920, "loss": 0.278, "lr": 2.529020178229297e-06, "epoch": 13.962264150943396, "percentage": 69.81, "elapsed_time": "0:45:03", "remaining_time": "0:19:29", "throughput": 5718.49, "total_tokens": 15461000} {"current_steps": 23685, "total_steps": 33920, "loss": 0.3695, "lr": 2.5267839150473846e-06, "epoch": 13.965212264150944, "percentage": 69.83, "elapsed_time": "0:45:04", "remaining_time": "0:19:28", "throughput": 5718.7, "total_tokens": 15464712} {"current_steps": 23690, "total_steps": 33920, "loss": 0.4236, "lr": 2.5245483066600896e-06, "epoch": 13.96816037735849, "percentage": 69.84, "elapsed_time": "0:45:04", "remaining_time": "0:19:28", "throughput": 5718.87, "total_tokens": 15468648} {"current_steps": 23695, "total_steps": 33920, "loss": 0.2932, "lr": 2.5223133536592996e-06, "epoch": 13.971108490566039, "percentage": 69.86, "elapsed_time": "0:45:05", "remaining_time": "0:19:27", "throughput": 5718.8, "total_tokens": 15471240} {"current_steps": 23700, "total_steps": 33920, "loss": 0.308, "lr": 2.520079056636725e-06, "epoch": 13.974056603773585, "percentage": 69.87, "elapsed_time": "0:45:05", "remaining_time": "0:19:26", "throughput": 5718.93, "total_tokens": 15474824} {"current_steps": 23705, "total_steps": 33920, "loss": 0.2688, "lr": 2.5178454161839106e-06, "epoch": 13.977004716981131, "percentage": 69.89, "elapsed_time": "0:45:06", "remaining_time": "0:19:26", "throughput": 5718.87, "total_tokens": 15477608} {"current_steps": 23710, "total_steps": 33920, "loss": 0.3269, "lr": 2.5156124328922195e-06, "epoch": 13.97995283018868, "percentage": 69.9, "elapsed_time": "0:45:06", "remaining_time": "0:19:25", "throughput": 5718.9, "total_tokens": 15480872} {"current_steps": 23715, "total_steps": 33920, "loss": 0.3005, "lr": 2.513380107352844e-06, "epoch": 13.982900943396226, "percentage": 69.91, "elapsed_time": "0:45:07", "remaining_time": "0:19:25", "throughput": 5718.92, "total_tokens": 15483656} {"current_steps": 23720, "total_steps": 33920, "loss": 0.2763, "lr": 2.5111484401568014e-06, "epoch": 13.985849056603774, "percentage": 69.93, "elapsed_time": "0:45:07", "remaining_time": "0:19:24", "throughput": 5719.02, "total_tokens": 15487016} {"current_steps": 23725, "total_steps": 33920, "loss": 0.3378, "lr": 2.508917431894936e-06, "epoch": 13.98879716981132, "percentage": 69.94, "elapsed_time": "0:45:08", "remaining_time": "0:19:23", "throughput": 5719.09, "total_tokens": 15489992} {"current_steps": 23730, "total_steps": 33920, "loss": 0.2797, "lr": 2.5066870831579144e-06, "epoch": 13.991745283018869, "percentage": 69.96, "elapsed_time": "0:45:08", "remaining_time": "0:19:23", "throughput": 5719.08, "total_tokens": 15492872} {"current_steps": 23735, "total_steps": 33920, "loss": 0.3308, "lr": 2.504457394536235e-06, "epoch": 13.994693396226415, "percentage": 69.97, "elapsed_time": "0:45:09", "remaining_time": "0:19:22", "throughput": 5719.02, "total_tokens": 15495496} {"current_steps": 23740, "total_steps": 33920, "loss": 0.2964, "lr": 2.502228366620216e-06, "epoch": 13.997641509433961, "percentage": 69.99, "elapsed_time": "0:45:09", "remaining_time": "0:19:22", "throughput": 5719.11, "total_tokens": 15498760} {"current_steps": 23744, "total_steps": 33920, "eval_loss": 0.5794597268104553, "epoch": 14.0, "percentage": 70.0, "elapsed_time": "0:45:29", "remaining_time": "0:19:29", "throughput": 5678.3, "total_tokens": 15500632} {"current_steps": 23745, "total_steps": 33920, "loss": 0.2296, "lr": 2.5000000000000015e-06, "epoch": 14.00058962264151, "percentage": 70.0, "elapsed_time": "0:45:33", "remaining_time": "0:19:31", "throughput": 5670.64, "total_tokens": 15501336} {"current_steps": 23750, "total_steps": 33920, "loss": 0.4409, "lr": 2.497772295265561e-06, "epoch": 14.003537735849056, "percentage": 70.02, "elapsed_time": "0:45:34", "remaining_time": "0:19:30", "throughput": 5670.77, "total_tokens": 15504728} {"current_steps": 23755, "total_steps": 33920, "loss": 0.5093, "lr": 2.4955452530066897e-06, "epoch": 14.006485849056604, "percentage": 70.03, "elapsed_time": "0:45:34", "remaining_time": "0:19:30", "throughput": 5670.77, "total_tokens": 15508280} {"current_steps": 23760, "total_steps": 33920, "loss": 0.4395, "lr": 2.4933188738130043e-06, "epoch": 14.00943396226415, "percentage": 70.05, "elapsed_time": "0:45:35", "remaining_time": "0:19:29", "throughput": 5670.75, "total_tokens": 15511224} {"current_steps": 23765, "total_steps": 33920, "loss": 0.2503, "lr": 2.49109315827395e-06, "epoch": 14.012382075471699, "percentage": 70.06, "elapsed_time": "0:45:35", "remaining_time": "0:19:29", "throughput": 5670.62, "total_tokens": 15514008} {"current_steps": 23770, "total_steps": 33920, "loss": 0.2367, "lr": 2.4888681069787975e-06, "epoch": 14.015330188679245, "percentage": 70.08, "elapsed_time": "0:45:36", "remaining_time": "0:19:28", "throughput": 5670.6, "total_tokens": 15517016} {"current_steps": 23775, "total_steps": 33920, "loss": 0.2587, "lr": 2.4866437205166353e-06, "epoch": 14.018278301886792, "percentage": 70.09, "elapsed_time": "0:45:37", "remaining_time": "0:19:27", "throughput": 5670.62, "total_tokens": 15520632} {"current_steps": 23780, "total_steps": 33920, "loss": 0.262, "lr": 2.4844199994763803e-06, "epoch": 14.02122641509434, "percentage": 70.11, "elapsed_time": "0:45:37", "remaining_time": "0:19:27", "throughput": 5670.64, "total_tokens": 15523832} {"current_steps": 23785, "total_steps": 33920, "loss": 0.3154, "lr": 2.482196944446772e-06, "epoch": 14.024174528301886, "percentage": 70.12, "elapsed_time": "0:45:38", "remaining_time": "0:19:26", "throughput": 5670.56, "total_tokens": 15526776} {"current_steps": 23790, "total_steps": 33920, "loss": 0.3213, "lr": 2.4799745560163736e-06, "epoch": 14.027122641509434, "percentage": 70.14, "elapsed_time": "0:45:38", "remaining_time": "0:19:26", "throughput": 5670.73, "total_tokens": 15530328} {"current_steps": 23795, "total_steps": 33920, "loss": 0.3617, "lr": 2.4777528347735707e-06, "epoch": 14.03007075471698, "percentage": 70.15, "elapsed_time": "0:45:39", "remaining_time": "0:19:25", "throughput": 5670.78, "total_tokens": 15533624} {"current_steps": 23800, "total_steps": 33920, "loss": 0.3075, "lr": 2.4755317813065766e-06, "epoch": 14.033018867924529, "percentage": 70.17, "elapsed_time": "0:45:39", "remaining_time": "0:19:24", "throughput": 5670.82, "total_tokens": 15536696} {"current_steps": 23805, "total_steps": 33920, "loss": 0.3541, "lr": 2.4733113962034234e-06, "epoch": 14.035966981132075, "percentage": 70.18, "elapsed_time": "0:45:40", "remaining_time": "0:19:24", "throughput": 5670.83, "total_tokens": 15539640} {"current_steps": 23810, "total_steps": 33920, "loss": 0.314, "lr": 2.4710916800519674e-06, "epoch": 14.038915094339623, "percentage": 70.19, "elapsed_time": "0:45:40", "remaining_time": "0:19:23", "throughput": 5670.82, "total_tokens": 15542648} {"current_steps": 23815, "total_steps": 33920, "loss": 0.3291, "lr": 2.4688726334398883e-06, "epoch": 14.04186320754717, "percentage": 70.21, "elapsed_time": "0:45:41", "remaining_time": "0:19:23", "throughput": 5670.84, "total_tokens": 15545912} {"current_steps": 23820, "total_steps": 33920, "loss": 0.3219, "lr": 2.466654256954688e-06, "epoch": 14.044811320754716, "percentage": 70.22, "elapsed_time": "0:45:41", "remaining_time": "0:19:22", "throughput": 5670.84, "total_tokens": 15549016} {"current_steps": 23825, "total_steps": 33920, "loss": 0.2469, "lr": 2.4644365511836895e-06, "epoch": 14.047759433962264, "percentage": 70.24, "elapsed_time": "0:45:42", "remaining_time": "0:19:22", "throughput": 5670.9, "total_tokens": 15552216} {"current_steps": 23830, "total_steps": 33920, "loss": 0.3636, "lr": 2.4622195167140432e-06, "epoch": 14.05070754716981, "percentage": 70.25, "elapsed_time": "0:45:43", "remaining_time": "0:19:21", "throughput": 5670.94, "total_tokens": 15555640} {"current_steps": 23835, "total_steps": 33920, "loss": 0.3689, "lr": 2.4600031541327173e-06, "epoch": 14.053655660377359, "percentage": 70.27, "elapsed_time": "0:45:43", "remaining_time": "0:19:20", "throughput": 5670.82, "total_tokens": 15558424} {"current_steps": 23840, "total_steps": 33920, "loss": 0.2814, "lr": 2.457787464026503e-06, "epoch": 14.056603773584905, "percentage": 70.28, "elapsed_time": "0:45:44", "remaining_time": "0:19:20", "throughput": 5670.71, "total_tokens": 15561112} {"current_steps": 23845, "total_steps": 33920, "loss": 0.2921, "lr": 2.455572446982014e-06, "epoch": 14.059551886792454, "percentage": 70.3, "elapsed_time": "0:45:44", "remaining_time": "0:19:19", "throughput": 5670.74, "total_tokens": 15564376} {"current_steps": 23850, "total_steps": 33920, "loss": 0.3222, "lr": 2.453358103585686e-06, "epoch": 14.0625, "percentage": 70.31, "elapsed_time": "0:45:45", "remaining_time": "0:19:19", "throughput": 5670.89, "total_tokens": 15567928} {"current_steps": 23855, "total_steps": 33920, "loss": 0.4102, "lr": 2.4511444344237733e-06, "epoch": 14.065448113207546, "percentage": 70.33, "elapsed_time": "0:45:46", "remaining_time": "0:19:18", "throughput": 5671.16, "total_tokens": 15574104} {"current_steps": 23860, "total_steps": 33920, "loss": 0.4085, "lr": 2.4489314400823567e-06, "epoch": 14.068396226415095, "percentage": 70.34, "elapsed_time": "0:45:46", "remaining_time": "0:19:18", "throughput": 5671.22, "total_tokens": 15577592} {"current_steps": 23865, "total_steps": 33920, "loss": 0.3375, "lr": 2.446719121147337e-06, "epoch": 14.071344339622641, "percentage": 70.36, "elapsed_time": "0:45:47", "remaining_time": "0:19:17", "throughput": 5671.19, "total_tokens": 15580600} {"current_steps": 23870, "total_steps": 33920, "loss": 0.2539, "lr": 2.4445074782044347e-06, "epoch": 14.07429245283019, "percentage": 70.37, "elapsed_time": "0:45:47", "remaining_time": "0:19:16", "throughput": 5671.06, "total_tokens": 15583224} {"current_steps": 23875, "total_steps": 33920, "loss": 0.3206, "lr": 2.442296511839191e-06, "epoch": 14.077240566037736, "percentage": 70.39, "elapsed_time": "0:45:48", "remaining_time": "0:19:16", "throughput": 5671.11, "total_tokens": 15586264} {"current_steps": 23880, "total_steps": 33920, "loss": 0.4368, "lr": 2.4400862226369687e-06, "epoch": 14.080188679245284, "percentage": 70.4, "elapsed_time": "0:45:48", "remaining_time": "0:19:15", "throughput": 5671.17, "total_tokens": 15589528} {"current_steps": 23885, "total_steps": 33920, "loss": 0.3599, "lr": 2.4378766111829514e-06, "epoch": 14.08313679245283, "percentage": 70.42, "elapsed_time": "0:45:49", "remaining_time": "0:19:15", "throughput": 5671.03, "total_tokens": 15592216} {"current_steps": 23890, "total_steps": 33920, "loss": 0.3327, "lr": 2.435667678062142e-06, "epoch": 14.086084905660377, "percentage": 70.43, "elapsed_time": "0:45:50", "remaining_time": "0:19:14", "throughput": 5671.13, "total_tokens": 15595672} {"current_steps": 23895, "total_steps": 33920, "loss": 0.3362, "lr": 2.4334594238593682e-06, "epoch": 14.089033018867925, "percentage": 70.45, "elapsed_time": "0:45:50", "remaining_time": "0:19:14", "throughput": 5671.27, "total_tokens": 15599768} {"current_steps": 23900, "total_steps": 33920, "loss": 0.3027, "lr": 2.4312518491592727e-06, "epoch": 14.091981132075471, "percentage": 70.46, "elapsed_time": "0:45:51", "remaining_time": "0:19:13", "throughput": 5671.29, "total_tokens": 15602872} {"current_steps": 23905, "total_steps": 33920, "loss": 0.3182, "lr": 2.429044954546322e-06, "epoch": 14.09492924528302, "percentage": 70.47, "elapsed_time": "0:45:51", "remaining_time": "0:19:12", "throughput": 5671.41, "total_tokens": 15606936} {"current_steps": 23910, "total_steps": 33920, "loss": 0.2793, "lr": 2.426838740604799e-06, "epoch": 14.097877358490566, "percentage": 70.49, "elapsed_time": "0:45:52", "remaining_time": "0:19:12", "throughput": 5671.43, "total_tokens": 15609752} {"current_steps": 23915, "total_steps": 33920, "loss": 0.2909, "lr": 2.4246332079188066e-06, "epoch": 14.100825471698114, "percentage": 70.5, "elapsed_time": "0:45:52", "remaining_time": "0:19:11", "throughput": 5671.55, "total_tokens": 15613720} {"current_steps": 23920, "total_steps": 33920, "loss": 0.3562, "lr": 2.4224283570722745e-06, "epoch": 14.10377358490566, "percentage": 70.52, "elapsed_time": "0:45:53", "remaining_time": "0:19:11", "throughput": 5671.51, "total_tokens": 15616632} {"current_steps": 23925, "total_steps": 33920, "loss": 0.3721, "lr": 2.420224188648943e-06, "epoch": 14.106721698113208, "percentage": 70.53, "elapsed_time": "0:45:54", "remaining_time": "0:19:10", "throughput": 5671.69, "total_tokens": 15620312} {"current_steps": 23930, "total_steps": 33920, "loss": 0.2583, "lr": 2.418020703232376e-06, "epoch": 14.109669811320755, "percentage": 70.55, "elapsed_time": "0:45:54", "remaining_time": "0:19:09", "throughput": 5671.78, "total_tokens": 15623736} {"current_steps": 23935, "total_steps": 33920, "loss": 0.3596, "lr": 2.4158179014059556e-06, "epoch": 14.112617924528301, "percentage": 70.56, "elapsed_time": "0:45:55", "remaining_time": "0:19:09", "throughput": 5671.85, "total_tokens": 15626936} {"current_steps": 23940, "total_steps": 33920, "loss": 0.3877, "lr": 2.413615783752883e-06, "epoch": 14.11556603773585, "percentage": 70.58, "elapsed_time": "0:45:55", "remaining_time": "0:19:08", "throughput": 5671.88, "total_tokens": 15630040} {"current_steps": 23945, "total_steps": 33920, "loss": 0.3231, "lr": 2.4114143508561767e-06, "epoch": 14.118514150943396, "percentage": 70.59, "elapsed_time": "0:45:56", "remaining_time": "0:19:08", "throughput": 5671.94, "total_tokens": 15633336} {"current_steps": 23950, "total_steps": 33920, "loss": 0.3425, "lr": 2.4092136032986783e-06, "epoch": 14.121462264150944, "percentage": 70.61, "elapsed_time": "0:45:56", "remaining_time": "0:19:07", "throughput": 5672.07, "total_tokens": 15636792} {"current_steps": 23955, "total_steps": 33920, "loss": 0.291, "lr": 2.407013541663043e-06, "epoch": 14.12441037735849, "percentage": 70.62, "elapsed_time": "0:45:57", "remaining_time": "0:19:07", "throughput": 5672.23, "total_tokens": 15640696} {"current_steps": 23960, "total_steps": 33920, "loss": 0.3281, "lr": 2.4048141665317493e-06, "epoch": 14.127358490566039, "percentage": 70.64, "elapsed_time": "0:45:58", "remaining_time": "0:19:06", "throughput": 5672.28, "total_tokens": 15644312} {"current_steps": 23965, "total_steps": 33920, "loss": 0.3335, "lr": 2.40261547848709e-06, "epoch": 14.130306603773585, "percentage": 70.65, "elapsed_time": "0:45:58", "remaining_time": "0:19:05", "throughput": 5672.18, "total_tokens": 15646840} {"current_steps": 23970, "total_steps": 33920, "loss": 0.2666, "lr": 2.400417478111176e-06, "epoch": 14.133254716981131, "percentage": 70.67, "elapsed_time": "0:45:59", "remaining_time": "0:19:05", "throughput": 5671.99, "total_tokens": 15649464} {"current_steps": 23975, "total_steps": 33920, "loss": 0.2872, "lr": 2.3982201659859387e-06, "epoch": 14.13620283018868, "percentage": 70.68, "elapsed_time": "0:45:59", "remaining_time": "0:19:04", "throughput": 5672.2, "total_tokens": 15653432} {"current_steps": 23980, "total_steps": 33920, "loss": 0.4049, "lr": 2.3960235426931237e-06, "epoch": 14.139150943396226, "percentage": 70.7, "elapsed_time": "0:46:00", "remaining_time": "0:19:04", "throughput": 5672.32, "total_tokens": 15657112} {"current_steps": 23985, "total_steps": 33920, "loss": 0.3375, "lr": 2.3938276088143003e-06, "epoch": 14.142099056603774, "percentage": 70.71, "elapsed_time": "0:46:00", "remaining_time": "0:19:03", "throughput": 5672.39, "total_tokens": 15660632} {"current_steps": 23990, "total_steps": 33920, "loss": 0.4826, "lr": 2.391632364930849e-06, "epoch": 14.14504716981132, "percentage": 70.73, "elapsed_time": "0:46:01", "remaining_time": "0:19:02", "throughput": 5672.26, "total_tokens": 15663064} {"current_steps": 23995, "total_steps": 33920, "loss": 0.357, "lr": 2.3894378116239706e-06, "epoch": 14.147995283018869, "percentage": 70.74, "elapsed_time": "0:46:01", "remaining_time": "0:19:02", "throughput": 5672.33, "total_tokens": 15666168} {"current_steps": 24000, "total_steps": 33920, "loss": 0.5006, "lr": 2.387243949474683e-06, "epoch": 14.150943396226415, "percentage": 70.75, "elapsed_time": "0:46:02", "remaining_time": "0:19:01", "throughput": 5672.46, "total_tokens": 15669528} {"current_steps": 24005, "total_steps": 33920, "loss": 0.2869, "lr": 2.38505077906382e-06, "epoch": 14.153891509433961, "percentage": 70.77, "elapsed_time": "0:46:02", "remaining_time": "0:19:01", "throughput": 5672.51, "total_tokens": 15673016} {"current_steps": 24010, "total_steps": 33920, "loss": 0.2432, "lr": 2.382858300972031e-06, "epoch": 14.15683962264151, "percentage": 70.78, "elapsed_time": "0:46:03", "remaining_time": "0:19:00", "throughput": 5672.7, "total_tokens": 15676696} {"current_steps": 24015, "total_steps": 33920, "loss": 0.4, "lr": 2.380666515779788e-06, "epoch": 14.159787735849056, "percentage": 70.8, "elapsed_time": "0:46:04", "remaining_time": "0:19:00", "throughput": 5672.81, "total_tokens": 15680600} {"current_steps": 24020, "total_steps": 33920, "loss": 0.2617, "lr": 2.3784754240673734e-06, "epoch": 14.162735849056604, "percentage": 70.81, "elapsed_time": "0:46:04", "remaining_time": "0:18:59", "throughput": 5672.88, "total_tokens": 15683800} {"current_steps": 24025, "total_steps": 33920, "loss": 0.3724, "lr": 2.3762850264148883e-06, "epoch": 14.16568396226415, "percentage": 70.83, "elapsed_time": "0:46:05", "remaining_time": "0:18:58", "throughput": 5672.81, "total_tokens": 15686616} {"current_steps": 24030, "total_steps": 33920, "loss": 0.2792, "lr": 2.374095323402251e-06, "epoch": 14.168632075471699, "percentage": 70.84, "elapsed_time": "0:46:05", "remaining_time": "0:18:58", "throughput": 5673.04, "total_tokens": 15690872} {"current_steps": 24035, "total_steps": 33920, "loss": 0.3147, "lr": 2.371906315609193e-06, "epoch": 14.171580188679245, "percentage": 70.86, "elapsed_time": "0:46:06", "remaining_time": "0:18:57", "throughput": 5673.07, "total_tokens": 15694104} {"current_steps": 24040, "total_steps": 33920, "loss": 0.4198, "lr": 2.369718003615263e-06, "epoch": 14.174528301886792, "percentage": 70.87, "elapsed_time": "0:46:06", "remaining_time": "0:18:57", "throughput": 5673.13, "total_tokens": 15697496} {"current_steps": 24045, "total_steps": 33920, "loss": 0.3282, "lr": 2.3675303879998284e-06, "epoch": 14.17747641509434, "percentage": 70.89, "elapsed_time": "0:46:07", "remaining_time": "0:18:56", "throughput": 5673.23, "total_tokens": 15701016} {"current_steps": 24050, "total_steps": 33920, "loss": 0.4184, "lr": 2.365343469342068e-06, "epoch": 14.180424528301886, "percentage": 70.9, "elapsed_time": "0:46:08", "remaining_time": "0:18:55", "throughput": 5673.11, "total_tokens": 15703512} {"current_steps": 24055, "total_steps": 33920, "loss": 0.2672, "lr": 2.3631572482209803e-06, "epoch": 14.183372641509434, "percentage": 70.92, "elapsed_time": "0:46:08", "remaining_time": "0:18:55", "throughput": 5673.23, "total_tokens": 15706936} {"current_steps": 24060, "total_steps": 33920, "loss": 0.3647, "lr": 2.3609717252153752e-06, "epoch": 14.18632075471698, "percentage": 70.93, "elapsed_time": "0:46:09", "remaining_time": "0:18:54", "throughput": 5673.06, "total_tokens": 15709560} {"current_steps": 24065, "total_steps": 33920, "loss": 0.3087, "lr": 2.35878690090388e-06, "epoch": 14.189268867924529, "percentage": 70.95, "elapsed_time": "0:46:09", "remaining_time": "0:18:54", "throughput": 5673.09, "total_tokens": 15712632} {"current_steps": 24070, "total_steps": 33920, "loss": 0.3228, "lr": 2.356602775864935e-06, "epoch": 14.192216981132075, "percentage": 70.96, "elapsed_time": "0:46:10", "remaining_time": "0:18:53", "throughput": 5673.14, "total_tokens": 15715800} {"current_steps": 24075, "total_steps": 33920, "loss": 0.348, "lr": 2.354419350676796e-06, "epoch": 14.195165094339623, "percentage": 70.98, "elapsed_time": "0:46:10", "remaining_time": "0:18:53", "throughput": 5673.14, "total_tokens": 15718936} {"current_steps": 24080, "total_steps": 33920, "loss": 0.2849, "lr": 2.3522366259175377e-06, "epoch": 14.19811320754717, "percentage": 70.99, "elapsed_time": "0:46:11", "remaining_time": "0:18:52", "throughput": 5673.18, "total_tokens": 15722072} {"current_steps": 24085, "total_steps": 33920, "loss": 0.3787, "lr": 2.350054602165044e-06, "epoch": 14.201061320754716, "percentage": 71.01, "elapsed_time": "0:46:11", "remaining_time": "0:18:51", "throughput": 5673.4, "total_tokens": 15726008} {"current_steps": 24090, "total_steps": 33920, "loss": 0.2859, "lr": 2.3478732799970143e-06, "epoch": 14.204009433962264, "percentage": 71.02, "elapsed_time": "0:46:12", "remaining_time": "0:18:51", "throughput": 5673.23, "total_tokens": 15728504} {"current_steps": 24095, "total_steps": 33920, "loss": 0.381, "lr": 2.3456926599909646e-06, "epoch": 14.20695754716981, "percentage": 71.03, "elapsed_time": "0:46:12", "remaining_time": "0:18:50", "throughput": 5673.27, "total_tokens": 15731768} {"current_steps": 24100, "total_steps": 33920, "loss": 0.3961, "lr": 2.343512742724222e-06, "epoch": 14.209905660377359, "percentage": 71.05, "elapsed_time": "0:46:13", "remaining_time": "0:18:50", "throughput": 5673.38, "total_tokens": 15735416} {"current_steps": 24105, "total_steps": 33920, "loss": 0.3129, "lr": 2.341333528773928e-06, "epoch": 14.212853773584905, "percentage": 71.06, "elapsed_time": "0:46:14", "remaining_time": "0:18:49", "throughput": 5673.6, "total_tokens": 15739896} {"current_steps": 24110, "total_steps": 33920, "loss": 0.3178, "lr": 2.3391550187170427e-06, "epoch": 14.215801886792454, "percentage": 71.08, "elapsed_time": "0:46:14", "remaining_time": "0:18:49", "throughput": 5673.57, "total_tokens": 15742712} {"current_steps": 24115, "total_steps": 33920, "loss": 0.3548, "lr": 2.336977213130333e-06, "epoch": 14.21875, "percentage": 71.09, "elapsed_time": "0:46:15", "remaining_time": "0:18:48", "throughput": 5673.52, "total_tokens": 15745528} {"current_steps": 24120, "total_steps": 33920, "loss": 0.4504, "lr": 2.3348001125903837e-06, "epoch": 14.221698113207546, "percentage": 71.11, "elapsed_time": "0:46:15", "remaining_time": "0:18:47", "throughput": 5673.52, "total_tokens": 15748536} {"current_steps": 24125, "total_steps": 33920, "loss": 0.2631, "lr": 2.3326237176735905e-06, "epoch": 14.224646226415095, "percentage": 71.12, "elapsed_time": "0:46:16", "remaining_time": "0:18:47", "throughput": 5673.34, "total_tokens": 15751000} {"current_steps": 24130, "total_steps": 33920, "loss": 0.2291, "lr": 2.330448028956164e-06, "epoch": 14.227594339622641, "percentage": 71.14, "elapsed_time": "0:46:16", "remaining_time": "0:18:46", "throughput": 5673.5, "total_tokens": 15754904} {"current_steps": 24135, "total_steps": 33920, "loss": 0.3708, "lr": 2.3282730470141255e-06, "epoch": 14.23054245283019, "percentage": 71.15, "elapsed_time": "0:46:17", "remaining_time": "0:18:46", "throughput": 5673.5, "total_tokens": 15757912} {"current_steps": 24140, "total_steps": 33920, "loss": 0.4114, "lr": 2.3260987724233143e-06, "epoch": 14.233490566037736, "percentage": 71.17, "elapsed_time": "0:46:17", "remaining_time": "0:18:45", "throughput": 5673.46, "total_tokens": 15760792} {"current_steps": 24145, "total_steps": 33920, "loss": 0.3103, "lr": 2.323925205759374e-06, "epoch": 14.236438679245284, "percentage": 71.18, "elapsed_time": "0:46:18", "remaining_time": "0:18:44", "throughput": 5673.4, "total_tokens": 15763704} {"current_steps": 24150, "total_steps": 33920, "loss": 0.3204, "lr": 2.3217523475977715e-06, "epoch": 14.23938679245283, "percentage": 71.2, "elapsed_time": "0:46:19", "remaining_time": "0:18:44", "throughput": 5673.44, "total_tokens": 15767128} {"current_steps": 24155, "total_steps": 33920, "loss": 0.4223, "lr": 2.3195801985137773e-06, "epoch": 14.242334905660377, "percentage": 71.21, "elapsed_time": "0:46:19", "remaining_time": "0:18:43", "throughput": 5673.65, "total_tokens": 15770904} {"current_steps": 24160, "total_steps": 33920, "loss": 0.2677, "lr": 2.317408759082478e-06, "epoch": 14.245283018867925, "percentage": 71.23, "elapsed_time": "0:46:20", "remaining_time": "0:18:43", "throughput": 5673.55, "total_tokens": 15773528} {"current_steps": 24165, "total_steps": 33920, "loss": 0.2553, "lr": 2.31523802987877e-06, "epoch": 14.248231132075471, "percentage": 71.24, "elapsed_time": "0:46:20", "remaining_time": "0:18:42", "throughput": 5673.47, "total_tokens": 15776312} {"current_steps": 24170, "total_steps": 33920, "loss": 0.3026, "lr": 2.3130680114773637e-06, "epoch": 14.25117924528302, "percentage": 71.26, "elapsed_time": "0:46:21", "remaining_time": "0:18:41", "throughput": 5673.18, "total_tokens": 15778680} {"current_steps": 24175, "total_steps": 33920, "loss": 0.3387, "lr": 2.310898704452782e-06, "epoch": 14.254127358490566, "percentage": 71.27, "elapsed_time": "0:46:21", "remaining_time": "0:18:41", "throughput": 5673.22, "total_tokens": 15782072} {"current_steps": 24180, "total_steps": 33920, "loss": 0.2779, "lr": 2.3087301093793584e-06, "epoch": 14.257075471698114, "percentage": 71.29, "elapsed_time": "0:46:22", "remaining_time": "0:18:40", "throughput": 5673.08, "total_tokens": 15784856} {"current_steps": 24185, "total_steps": 33920, "loss": 0.3186, "lr": 2.306562226831237e-06, "epoch": 14.26002358490566, "percentage": 71.3, "elapsed_time": "0:46:22", "remaining_time": "0:18:40", "throughput": 5673.14, "total_tokens": 15788024} {"current_steps": 24190, "total_steps": 33920, "loss": 0.2294, "lr": 2.304395057382374e-06, "epoch": 14.262971698113208, "percentage": 71.31, "elapsed_time": "0:46:23", "remaining_time": "0:18:39", "throughput": 5673.04, "total_tokens": 15790648} {"current_steps": 24195, "total_steps": 33920, "loss": 0.3453, "lr": 2.3022286016065354e-06, "epoch": 14.265919811320755, "percentage": 71.33, "elapsed_time": "0:46:23", "remaining_time": "0:18:38", "throughput": 5673.05, "total_tokens": 15793656} {"current_steps": 24200, "total_steps": 33920, "loss": 0.2681, "lr": 2.300062860077303e-06, "epoch": 14.268867924528301, "percentage": 71.34, "elapsed_time": "0:46:24", "remaining_time": "0:18:38", "throughput": 5672.98, "total_tokens": 15796248} {"current_steps": 24205, "total_steps": 33920, "loss": 0.3628, "lr": 2.297897833368064e-06, "epoch": 14.27181603773585, "percentage": 71.36, "elapsed_time": "0:46:25", "remaining_time": "0:18:37", "throughput": 5672.93, "total_tokens": 15799192} {"current_steps": 24210, "total_steps": 33920, "loss": 0.3291, "lr": 2.2957335220520194e-06, "epoch": 14.274764150943396, "percentage": 71.37, "elapsed_time": "0:46:25", "remaining_time": "0:18:37", "throughput": 5672.69, "total_tokens": 15801496} {"current_steps": 24215, "total_steps": 33920, "loss": 0.2567, "lr": 2.293569926702179e-06, "epoch": 14.277712264150944, "percentage": 71.39, "elapsed_time": "0:46:26", "remaining_time": "0:18:36", "throughput": 5672.91, "total_tokens": 15806520} {"current_steps": 24220, "total_steps": 33920, "loss": 0.3222, "lr": 2.291407047891366e-06, "epoch": 14.28066037735849, "percentage": 71.4, "elapsed_time": "0:46:26", "remaining_time": "0:18:36", "throughput": 5673.03, "total_tokens": 15810584} {"current_steps": 24225, "total_steps": 33920, "loss": 0.3436, "lr": 2.2892448861922075e-06, "epoch": 14.283608490566039, "percentage": 71.42, "elapsed_time": "0:46:27", "remaining_time": "0:18:35", "throughput": 5673.15, "total_tokens": 15814072} {"current_steps": 24230, "total_steps": 33920, "loss": 0.3707, "lr": 2.2870834421771505e-06, "epoch": 14.286556603773585, "percentage": 71.43, "elapsed_time": "0:46:28", "remaining_time": "0:18:34", "throughput": 5673.09, "total_tokens": 15816984} {"current_steps": 24235, "total_steps": 33920, "loss": 0.313, "lr": 2.2849227164184433e-06, "epoch": 14.289504716981131, "percentage": 71.45, "elapsed_time": "0:46:28", "remaining_time": "0:18:34", "throughput": 5673.15, "total_tokens": 15820280} {"current_steps": 24240, "total_steps": 33920, "loss": 0.4984, "lr": 2.2827627094881473e-06, "epoch": 14.29245283018868, "percentage": 71.46, "elapsed_time": "0:46:29", "remaining_time": "0:18:33", "throughput": 5673.55, "total_tokens": 15826072} {"current_steps": 24245, "total_steps": 33920, "loss": 0.2882, "lr": 2.2806034219581364e-06, "epoch": 14.295400943396226, "percentage": 71.48, "elapsed_time": "0:46:30", "remaining_time": "0:18:33", "throughput": 5673.86, "total_tokens": 15831416} {"current_steps": 24250, "total_steps": 33920, "loss": 0.4109, "lr": 2.278444854400089e-06, "epoch": 14.298349056603774, "percentage": 71.49, "elapsed_time": "0:46:30", "remaining_time": "0:18:32", "throughput": 5673.82, "total_tokens": 15834200} {"current_steps": 24255, "total_steps": 33920, "loss": 0.3489, "lr": 2.276287007385496e-06, "epoch": 14.30129716981132, "percentage": 71.51, "elapsed_time": "0:46:31", "remaining_time": "0:18:32", "throughput": 5673.83, "total_tokens": 15837016} {"current_steps": 24260, "total_steps": 33920, "loss": 0.2863, "lr": 2.2741298814856542e-06, "epoch": 14.304245283018869, "percentage": 71.52, "elapsed_time": "0:46:31", "remaining_time": "0:18:31", "throughput": 5673.96, "total_tokens": 15840760} {"current_steps": 24265, "total_steps": 33920, "loss": 0.2631, "lr": 2.2719734772716763e-06, "epoch": 14.307193396226415, "percentage": 71.54, "elapsed_time": "0:46:32", "remaining_time": "0:18:31", "throughput": 5673.94, "total_tokens": 15844184} {"current_steps": 24270, "total_steps": 33920, "loss": 0.3773, "lr": 2.269817795314477e-06, "epoch": 14.310141509433961, "percentage": 71.55, "elapsed_time": "0:46:33", "remaining_time": "0:18:30", "throughput": 5674.21, "total_tokens": 15848760} {"current_steps": 24275, "total_steps": 33920, "loss": 0.2671, "lr": 2.2676628361847834e-06, "epoch": 14.31308962264151, "percentage": 71.57, "elapsed_time": "0:46:33", "remaining_time": "0:18:29", "throughput": 5674.32, "total_tokens": 15851960} {"current_steps": 24280, "total_steps": 33920, "loss": 0.3662, "lr": 2.2655086004531296e-06, "epoch": 14.316037735849056, "percentage": 71.58, "elapsed_time": "0:46:34", "remaining_time": "0:18:29", "throughput": 5674.49, "total_tokens": 15855960} {"current_steps": 24285, "total_steps": 33920, "loss": 0.3505, "lr": 2.2633550886898583e-06, "epoch": 14.318985849056604, "percentage": 71.59, "elapsed_time": "0:46:34", "remaining_time": "0:18:28", "throughput": 5674.42, "total_tokens": 15858744} {"current_steps": 24290, "total_steps": 33920, "loss": 0.3486, "lr": 2.26120230146512e-06, "epoch": 14.32193396226415, "percentage": 71.61, "elapsed_time": "0:46:35", "remaining_time": "0:18:28", "throughput": 5674.43, "total_tokens": 15861752} {"current_steps": 24295, "total_steps": 33920, "loss": 0.3813, "lr": 2.2590502393488777e-06, "epoch": 14.324882075471699, "percentage": 71.62, "elapsed_time": "0:46:35", "remaining_time": "0:18:27", "throughput": 5674.61, "total_tokens": 15865784} {"current_steps": 24300, "total_steps": 33920, "loss": 0.3559, "lr": 2.256898902910898e-06, "epoch": 14.327830188679245, "percentage": 71.64, "elapsed_time": "0:46:36", "remaining_time": "0:18:27", "throughput": 5674.5, "total_tokens": 15868280} {"current_steps": 24305, "total_steps": 33920, "loss": 0.3393, "lr": 2.2547482927207548e-06, "epoch": 14.330778301886792, "percentage": 71.65, "elapsed_time": "0:46:36", "remaining_time": "0:18:26", "throughput": 5674.59, "total_tokens": 15871672} {"current_steps": 24310, "total_steps": 33920, "loss": 0.3198, "lr": 2.252598409347833e-06, "epoch": 14.33372641509434, "percentage": 71.67, "elapsed_time": "0:46:37", "remaining_time": "0:18:25", "throughput": 5674.51, "total_tokens": 15874840} {"current_steps": 24315, "total_steps": 33920, "loss": 0.3886, "lr": 2.250449253361323e-06, "epoch": 14.336674528301886, "percentage": 71.68, "elapsed_time": "0:46:38", "remaining_time": "0:18:25", "throughput": 5674.58, "total_tokens": 15878264} {"current_steps": 24320, "total_steps": 33920, "loss": 0.3586, "lr": 2.2483008253302214e-06, "epoch": 14.339622641509434, "percentage": 71.7, "elapsed_time": "0:46:38", "remaining_time": "0:18:24", "throughput": 5674.53, "total_tokens": 15881528} {"current_steps": 24325, "total_steps": 33920, "loss": 0.3412, "lr": 2.246153125823337e-06, "epoch": 14.34257075471698, "percentage": 71.71, "elapsed_time": "0:46:39", "remaining_time": "0:18:24", "throughput": 5674.68, "total_tokens": 15885304} {"current_steps": 24330, "total_steps": 33920, "loss": 0.4714, "lr": 2.2440061554092813e-06, "epoch": 14.345518867924529, "percentage": 71.73, "elapsed_time": "0:46:39", "remaining_time": "0:18:23", "throughput": 5674.62, "total_tokens": 15888408} {"current_steps": 24335, "total_steps": 33920, "loss": 0.2547, "lr": 2.2418599146564714e-06, "epoch": 14.348466981132075, "percentage": 71.74, "elapsed_time": "0:46:40", "remaining_time": "0:18:23", "throughput": 5674.71, "total_tokens": 15892280} {"current_steps": 24340, "total_steps": 33920, "loss": 0.2886, "lr": 2.239714404133138e-06, "epoch": 14.351415094339623, "percentage": 71.76, "elapsed_time": "0:46:41", "remaining_time": "0:18:22", "throughput": 5674.64, "total_tokens": 15895064} {"current_steps": 24345, "total_steps": 33920, "loss": 0.3512, "lr": 2.2375696244073126e-06, "epoch": 14.35436320754717, "percentage": 71.77, "elapsed_time": "0:46:41", "remaining_time": "0:18:21", "throughput": 5674.71, "total_tokens": 15898232} {"current_steps": 24350, "total_steps": 33920, "loss": 0.3115, "lr": 2.235425576046834e-06, "epoch": 14.357311320754716, "percentage": 71.79, "elapsed_time": "0:46:42", "remaining_time": "0:18:21", "throughput": 5674.48, "total_tokens": 15900472} {"current_steps": 24355, "total_steps": 33920, "loss": 0.33, "lr": 2.233282259619347e-06, "epoch": 14.360259433962264, "percentage": 71.8, "elapsed_time": "0:46:42", "remaining_time": "0:18:20", "throughput": 5674.28, "total_tokens": 15902808} {"current_steps": 24360, "total_steps": 33920, "loss": 0.3507, "lr": 2.231139675692308e-06, "epoch": 14.36320754716981, "percentage": 71.82, "elapsed_time": "0:46:43", "remaining_time": "0:18:20", "throughput": 5674.36, "total_tokens": 15906136} {"current_steps": 24365, "total_steps": 33920, "loss": 0.372, "lr": 2.228997824832973e-06, "epoch": 14.366155660377359, "percentage": 71.83, "elapsed_time": "0:46:44", "remaining_time": "0:18:19", "throughput": 5674.68, "total_tokens": 15912728} {"current_steps": 24370, "total_steps": 33920, "loss": 0.2313, "lr": 2.226856707608406e-06, "epoch": 14.369103773584905, "percentage": 71.85, "elapsed_time": "0:46:44", "remaining_time": "0:18:19", "throughput": 5674.9, "total_tokens": 15917016} {"current_steps": 24375, "total_steps": 33920, "loss": 0.3072, "lr": 2.2247163245854768e-06, "epoch": 14.372051886792454, "percentage": 71.86, "elapsed_time": "0:46:45", "remaining_time": "0:18:18", "throughput": 5674.67, "total_tokens": 15919128} {"current_steps": 24380, "total_steps": 33920, "loss": 0.3135, "lr": 2.222576676330862e-06, "epoch": 14.375, "percentage": 71.88, "elapsed_time": "0:46:45", "remaining_time": "0:18:17", "throughput": 5674.58, "total_tokens": 15921752} {"current_steps": 24385, "total_steps": 33920, "loss": 0.3074, "lr": 2.2204377634110403e-06, "epoch": 14.377948113207546, "percentage": 71.89, "elapsed_time": "0:46:46", "remaining_time": "0:18:17", "throughput": 5674.77, "total_tokens": 15925784} {"current_steps": 24390, "total_steps": 33920, "loss": 0.3555, "lr": 2.218299586392301e-06, "epoch": 14.380896226415095, "percentage": 71.9, "elapsed_time": "0:46:46", "remaining_time": "0:18:16", "throughput": 5674.74, "total_tokens": 15928632} {"current_steps": 24395, "total_steps": 33920, "loss": 0.3114, "lr": 2.2161621458407355e-06, "epoch": 14.383844339622641, "percentage": 71.92, "elapsed_time": "0:46:47", "remaining_time": "0:18:16", "throughput": 5674.87, "total_tokens": 15932216} {"current_steps": 24400, "total_steps": 33920, "loss": 0.3, "lr": 2.2140254423222398e-06, "epoch": 14.38679245283019, "percentage": 71.93, "elapsed_time": "0:46:48", "remaining_time": "0:18:15", "throughput": 5675.0, "total_tokens": 15935800} {"current_steps": 24405, "total_steps": 33920, "loss": 0.2226, "lr": 2.2118894764025146e-06, "epoch": 14.389740566037736, "percentage": 71.95, "elapsed_time": "0:46:48", "remaining_time": "0:18:15", "throughput": 5674.93, "total_tokens": 15938520} {"current_steps": 24410, "total_steps": 33920, "loss": 0.3389, "lr": 2.2097542486470667e-06, "epoch": 14.392688679245284, "percentage": 71.96, "elapsed_time": "0:46:49", "remaining_time": "0:18:14", "throughput": 5675.05, "total_tokens": 15941752} {"current_steps": 24415, "total_steps": 33920, "loss": 0.3444, "lr": 2.207619759621205e-06, "epoch": 14.39563679245283, "percentage": 71.98, "elapsed_time": "0:46:49", "remaining_time": "0:18:13", "throughput": 5675.17, "total_tokens": 15945272} {"current_steps": 24420, "total_steps": 33920, "loss": 0.3377, "lr": 2.205486009890049e-06, "epoch": 14.398584905660377, "percentage": 71.99, "elapsed_time": "0:46:50", "remaining_time": "0:18:13", "throughput": 5675.32, "total_tokens": 15948952} {"current_steps": 24425, "total_steps": 33920, "loss": 0.2825, "lr": 2.2033530000185146e-06, "epoch": 14.401533018867925, "percentage": 72.01, "elapsed_time": "0:46:51", "remaining_time": "0:18:12", "throughput": 5675.51, "total_tokens": 15954680} {"current_steps": 24430, "total_steps": 33920, "loss": 0.3256, "lr": 2.2012207305713244e-06, "epoch": 14.404481132075471, "percentage": 72.02, "elapsed_time": "0:46:51", "remaining_time": "0:18:12", "throughput": 5675.27, "total_tokens": 15956984} {"current_steps": 24435, "total_steps": 33920, "loss": 0.3601, "lr": 2.19908920211301e-06, "epoch": 14.40742924528302, "percentage": 72.04, "elapsed_time": "0:46:52", "remaining_time": "0:18:11", "throughput": 5675.3, "total_tokens": 15959960} {"current_steps": 24440, "total_steps": 33920, "loss": 0.2407, "lr": 2.196958415207901e-06, "epoch": 14.410377358490566, "percentage": 72.05, "elapsed_time": "0:46:52", "remaining_time": "0:18:11", "throughput": 5675.32, "total_tokens": 15963416} {"current_steps": 24445, "total_steps": 33920, "loss": 0.3438, "lr": 2.1948283704201312e-06, "epoch": 14.413325471698114, "percentage": 72.07, "elapsed_time": "0:46:53", "remaining_time": "0:18:10", "throughput": 5675.3, "total_tokens": 15966488} {"current_steps": 24450, "total_steps": 33920, "loss": 0.3504, "lr": 2.1926990683136383e-06, "epoch": 14.41627358490566, "percentage": 72.08, "elapsed_time": "0:46:53", "remaining_time": "0:18:09", "throughput": 5675.39, "total_tokens": 15969784} {"current_steps": 24455, "total_steps": 33920, "loss": 0.3158, "lr": 2.1905705094521685e-06, "epoch": 14.419221698113208, "percentage": 72.1, "elapsed_time": "0:46:54", "remaining_time": "0:18:09", "throughput": 5675.38, "total_tokens": 15972696} {"current_steps": 24460, "total_steps": 33920, "loss": 0.3193, "lr": 2.1884426943992635e-06, "epoch": 14.422169811320755, "percentage": 72.11, "elapsed_time": "0:46:54", "remaining_time": "0:18:08", "throughput": 5675.48, "total_tokens": 15975832} {"current_steps": 24465, "total_steps": 33920, "loss": 0.3011, "lr": 2.1863156237182727e-06, "epoch": 14.425117924528301, "percentage": 72.13, "elapsed_time": "0:46:55", "remaining_time": "0:18:08", "throughput": 5675.47, "total_tokens": 15978936} {"current_steps": 24470, "total_steps": 33920, "loss": 0.2822, "lr": 2.1841892979723466e-06, "epoch": 14.42806603773585, "percentage": 72.14, "elapsed_time": "0:46:56", "remaining_time": "0:18:07", "throughput": 5675.32, "total_tokens": 15981752} {"current_steps": 24475, "total_steps": 33920, "loss": 0.3454, "lr": 2.1820637177244375e-06, "epoch": 14.431014150943396, "percentage": 72.16, "elapsed_time": "0:46:56", "remaining_time": "0:18:06", "throughput": 5675.18, "total_tokens": 15984536} {"current_steps": 24480, "total_steps": 33920, "loss": 0.2998, "lr": 2.179938883537306e-06, "epoch": 14.433962264150944, "percentage": 72.17, "elapsed_time": "0:46:57", "remaining_time": "0:18:06", "throughput": 5674.98, "total_tokens": 15987288} {"current_steps": 24485, "total_steps": 33920, "loss": 0.3096, "lr": 2.177814795973508e-06, "epoch": 14.43691037735849, "percentage": 72.18, "elapsed_time": "0:46:57", "remaining_time": "0:18:05", "throughput": 5675.11, "total_tokens": 15990840} {"current_steps": 24490, "total_steps": 33920, "loss": 0.2668, "lr": 2.1756914555954064e-06, "epoch": 14.439858490566039, "percentage": 72.2, "elapsed_time": "0:46:58", "remaining_time": "0:18:05", "throughput": 5675.11, "total_tokens": 15994424} {"current_steps": 24495, "total_steps": 33920, "loss": 0.2608, "lr": 2.173568862965164e-06, "epoch": 14.442806603773585, "percentage": 72.21, "elapsed_time": "0:46:58", "remaining_time": "0:18:04", "throughput": 5675.1, "total_tokens": 15997880} {"current_steps": 24500, "total_steps": 33920, "loss": 0.5477, "lr": 2.171447018644746e-06, "epoch": 14.445754716981131, "percentage": 72.23, "elapsed_time": "0:46:59", "remaining_time": "0:18:04", "throughput": 5674.99, "total_tokens": 16000472} {"current_steps": 24505, "total_steps": 33920, "loss": 0.3466, "lr": 2.1693259231959186e-06, "epoch": 14.44870283018868, "percentage": 72.24, "elapsed_time": "0:46:59", "remaining_time": "0:18:03", "throughput": 5675.01, "total_tokens": 16003512} {"current_steps": 24510, "total_steps": 33920, "loss": 0.3931, "lr": 2.1672055771802545e-06, "epoch": 14.451650943396226, "percentage": 72.26, "elapsed_time": "0:47:00", "remaining_time": "0:18:02", "throughput": 5675.04, "total_tokens": 16006520} {"current_steps": 24515, "total_steps": 33920, "loss": 0.265, "lr": 2.1650859811591224e-06, "epoch": 14.454599056603774, "percentage": 72.27, "elapsed_time": "0:47:01", "remaining_time": "0:18:02", "throughput": 5675.13, "total_tokens": 16009592} {"current_steps": 24520, "total_steps": 33920, "loss": 0.3259, "lr": 2.1629671356936943e-06, "epoch": 14.45754716981132, "percentage": 72.29, "elapsed_time": "0:47:01", "remaining_time": "0:18:01", "throughput": 5675.24, "total_tokens": 16013656} {"current_steps": 24525, "total_steps": 33920, "loss": 0.2691, "lr": 2.1608490413449428e-06, "epoch": 14.460495283018869, "percentage": 72.3, "elapsed_time": "0:47:02", "remaining_time": "0:18:01", "throughput": 5675.28, "total_tokens": 16016856} {"current_steps": 24530, "total_steps": 33920, "loss": 0.3788, "lr": 2.158731698673645e-06, "epoch": 14.463443396226415, "percentage": 72.32, "elapsed_time": "0:47:02", "remaining_time": "0:18:00", "throughput": 5675.15, "total_tokens": 16019256} {"current_steps": 24535, "total_steps": 33920, "loss": 0.2687, "lr": 2.1566151082403752e-06, "epoch": 14.466391509433961, "percentage": 72.33, "elapsed_time": "0:47:03", "remaining_time": "0:17:59", "throughput": 5675.14, "total_tokens": 16022104} {"current_steps": 24540, "total_steps": 33920, "loss": 0.2921, "lr": 2.154499270605508e-06, "epoch": 14.46933962264151, "percentage": 72.35, "elapsed_time": "0:47:03", "remaining_time": "0:17:59", "throughput": 5675.04, "total_tokens": 16025112} {"current_steps": 24545, "total_steps": 33920, "loss": 0.3586, "lr": 2.1523841863292243e-06, "epoch": 14.472287735849056, "percentage": 72.36, "elapsed_time": "0:47:04", "remaining_time": "0:17:58", "throughput": 5674.9, "total_tokens": 16028088} {"current_steps": 24550, "total_steps": 33920, "loss": 0.3377, "lr": 2.1502698559714998e-06, "epoch": 14.475235849056604, "percentage": 72.38, "elapsed_time": "0:47:04", "remaining_time": "0:17:58", "throughput": 5675.02, "total_tokens": 16031640} {"current_steps": 24555, "total_steps": 33920, "loss": 0.3389, "lr": 2.1481562800921125e-06, "epoch": 14.47818396226415, "percentage": 72.39, "elapsed_time": "0:47:05", "remaining_time": "0:17:57", "throughput": 5675.1, "total_tokens": 16035064} {"current_steps": 24560, "total_steps": 33920, "loss": 0.3088, "lr": 2.146043459250641e-06, "epoch": 14.481132075471699, "percentage": 72.41, "elapsed_time": "0:47:06", "remaining_time": "0:17:57", "throughput": 5675.01, "total_tokens": 16037848} {"current_steps": 24565, "total_steps": 33920, "loss": 0.3072, "lr": 2.1439313940064634e-06, "epoch": 14.484080188679245, "percentage": 72.42, "elapsed_time": "0:47:06", "remaining_time": "0:17:56", "throughput": 5675.08, "total_tokens": 16041432} {"current_steps": 24570, "total_steps": 33920, "loss": 0.3589, "lr": 2.141820084918756e-06, "epoch": 14.487028301886792, "percentage": 72.44, "elapsed_time": "0:47:07", "remaining_time": "0:17:55", "throughput": 5675.25, "total_tokens": 16045656} {"current_steps": 24575, "total_steps": 33920, "loss": 0.3401, "lr": 2.1397095325465013e-06, "epoch": 14.48997641509434, "percentage": 72.45, "elapsed_time": "0:47:07", "remaining_time": "0:17:55", "throughput": 5675.21, "total_tokens": 16048760} {"current_steps": 24580, "total_steps": 33920, "loss": 0.3185, "lr": 2.1375997374484754e-06, "epoch": 14.492924528301886, "percentage": 72.46, "elapsed_time": "0:47:08", "remaining_time": "0:17:54", "throughput": 5675.39, "total_tokens": 16052792} {"current_steps": 24585, "total_steps": 33920, "loss": 0.3174, "lr": 2.1354907001832546e-06, "epoch": 14.495872641509434, "percentage": 72.48, "elapsed_time": "0:47:09", "remaining_time": "0:17:54", "throughput": 5675.22, "total_tokens": 16055544} {"current_steps": 24590, "total_steps": 33920, "loss": 0.2882, "lr": 2.133382421309217e-06, "epoch": 14.49882075471698, "percentage": 72.49, "elapsed_time": "0:47:09", "remaining_time": "0:17:53", "throughput": 5675.15, "total_tokens": 16058168} {"current_steps": 24595, "total_steps": 33920, "loss": 0.3229, "lr": 2.131274901384537e-06, "epoch": 14.501768867924529, "percentage": 72.51, "elapsed_time": "0:47:10", "remaining_time": "0:17:53", "throughput": 5675.31, "total_tokens": 16062072} {"current_steps": 24600, "total_steps": 33920, "loss": 0.3107, "lr": 2.1291681409671896e-06, "epoch": 14.504716981132075, "percentage": 72.52, "elapsed_time": "0:47:10", "remaining_time": "0:17:52", "throughput": 5675.22, "total_tokens": 16064824} {"current_steps": 24605, "total_steps": 33920, "loss": 0.302, "lr": 2.12706214061495e-06, "epoch": 14.507665094339622, "percentage": 72.54, "elapsed_time": "0:47:11", "remaining_time": "0:17:51", "throughput": 5675.08, "total_tokens": 16067320} {"current_steps": 24610, "total_steps": 33920, "loss": 0.4105, "lr": 2.124956900885391e-06, "epoch": 14.51061320754717, "percentage": 72.55, "elapsed_time": "0:47:11", "remaining_time": "0:17:51", "throughput": 5675.02, "total_tokens": 16070008} {"current_steps": 24615, "total_steps": 33920, "loss": 0.2902, "lr": 2.1228524223358833e-06, "epoch": 14.513561320754716, "percentage": 72.57, "elapsed_time": "0:47:12", "remaining_time": "0:17:50", "throughput": 5674.89, "total_tokens": 16072504} {"current_steps": 24620, "total_steps": 33920, "loss": 0.3866, "lr": 2.120748705523595e-06, "epoch": 14.516509433962264, "percentage": 72.58, "elapsed_time": "0:47:12", "remaining_time": "0:17:50", "throughput": 5674.9, "total_tokens": 16075896} {"current_steps": 24625, "total_steps": 33920, "loss": 0.2418, "lr": 2.1186457510054976e-06, "epoch": 14.51945754716981, "percentage": 72.6, "elapsed_time": "0:47:13", "remaining_time": "0:17:49", "throughput": 5674.73, "total_tokens": 16078296} {"current_steps": 24630, "total_steps": 33920, "loss": 0.3203, "lr": 2.116543559338355e-06, "epoch": 14.522405660377359, "percentage": 72.61, "elapsed_time": "0:47:13", "remaining_time": "0:17:48", "throughput": 5674.61, "total_tokens": 16080792} {"current_steps": 24635, "total_steps": 33920, "loss": 0.3166, "lr": 2.1144421310787305e-06, "epoch": 14.525353773584905, "percentage": 72.63, "elapsed_time": "0:47:14", "remaining_time": "0:17:48", "throughput": 5674.73, "total_tokens": 16084152} {"current_steps": 24640, "total_steps": 33920, "loss": 0.3757, "lr": 2.11234146678299e-06, "epoch": 14.528301886792454, "percentage": 72.64, "elapsed_time": "0:47:14", "remaining_time": "0:17:47", "throughput": 5674.74, "total_tokens": 16087192} {"current_steps": 24645, "total_steps": 33920, "loss": 0.4327, "lr": 2.1102415670072907e-06, "epoch": 14.53125, "percentage": 72.66, "elapsed_time": "0:47:15", "remaining_time": "0:17:47", "throughput": 5674.8, "total_tokens": 16090392} {"current_steps": 24650, "total_steps": 33920, "loss": 0.4116, "lr": 2.108142432307591e-06, "epoch": 14.534198113207546, "percentage": 72.67, "elapsed_time": "0:47:16", "remaining_time": "0:17:46", "throughput": 5674.91, "total_tokens": 16094200} {"current_steps": 24655, "total_steps": 33920, "loss": 0.259, "lr": 2.1060440632396456e-06, "epoch": 14.537146226415095, "percentage": 72.69, "elapsed_time": "0:47:16", "remaining_time": "0:17:45", "throughput": 5675.01, "total_tokens": 16098008} {"current_steps": 24660, "total_steps": 33920, "loss": 0.2354, "lr": 2.103946460359007e-06, "epoch": 14.540094339622641, "percentage": 72.7, "elapsed_time": "0:47:17", "remaining_time": "0:17:45", "throughput": 5674.92, "total_tokens": 16100664} {"current_steps": 24665, "total_steps": 33920, "loss": 0.3667, "lr": 2.101849624221022e-06, "epoch": 14.54304245283019, "percentage": 72.72, "elapsed_time": "0:47:17", "remaining_time": "0:17:44", "throughput": 5674.86, "total_tokens": 16103384} {"current_steps": 24670, "total_steps": 33920, "loss": 0.2406, "lr": 2.0997535553808417e-06, "epoch": 14.545990566037736, "percentage": 72.73, "elapsed_time": "0:47:18", "remaining_time": "0:17:44", "throughput": 5674.88, "total_tokens": 16106488} {"current_steps": 24675, "total_steps": 33920, "loss": 0.2744, "lr": 2.0976582543934064e-06, "epoch": 14.548938679245284, "percentage": 72.74, "elapsed_time": "0:47:18", "remaining_time": "0:17:43", "throughput": 5675.09, "total_tokens": 16110360} {"current_steps": 24680, "total_steps": 33920, "loss": 0.2792, "lr": 2.0955637218134573e-06, "epoch": 14.55188679245283, "percentage": 72.76, "elapsed_time": "0:47:19", "remaining_time": "0:17:43", "throughput": 5675.22, "total_tokens": 16113880} {"current_steps": 24685, "total_steps": 33920, "loss": 0.2526, "lr": 2.09346995819553e-06, "epoch": 14.554834905660378, "percentage": 72.77, "elapsed_time": "0:47:19", "remaining_time": "0:17:42", "throughput": 5675.28, "total_tokens": 16117080} {"current_steps": 24690, "total_steps": 33920, "loss": 0.4293, "lr": 2.0913769640939553e-06, "epoch": 14.557783018867925, "percentage": 72.79, "elapsed_time": "0:47:20", "remaining_time": "0:17:41", "throughput": 5675.31, "total_tokens": 16120440} {"current_steps": 24695, "total_steps": 33920, "loss": 0.4181, "lr": 2.0892847400628674e-06, "epoch": 14.560731132075471, "percentage": 72.8, "elapsed_time": "0:47:20", "remaining_time": "0:17:41", "throughput": 5675.45, "total_tokens": 16123864} {"current_steps": 24700, "total_steps": 33920, "loss": 0.311, "lr": 2.0871932866561885e-06, "epoch": 14.56367924528302, "percentage": 72.82, "elapsed_time": "0:47:21", "remaining_time": "0:17:40", "throughput": 5675.54, "total_tokens": 16127032} {"current_steps": 24705, "total_steps": 33920, "loss": 0.301, "lr": 2.0851026044276405e-06, "epoch": 14.566627358490566, "percentage": 72.83, "elapsed_time": "0:47:22", "remaining_time": "0:17:40", "throughput": 5675.41, "total_tokens": 16129528} {"current_steps": 24710, "total_steps": 33920, "loss": 0.3594, "lr": 2.083012693930741e-06, "epoch": 14.569575471698114, "percentage": 72.85, "elapsed_time": "0:47:22", "remaining_time": "0:17:39", "throughput": 5675.11, "total_tokens": 16131864} {"current_steps": 24715, "total_steps": 33920, "loss": 0.2058, "lr": 2.0809235557188e-06, "epoch": 14.57252358490566, "percentage": 72.86, "elapsed_time": "0:47:23", "remaining_time": "0:17:38", "throughput": 5675.24, "total_tokens": 16135992} {"current_steps": 24720, "total_steps": 33920, "loss": 0.3389, "lr": 2.0788351903449307e-06, "epoch": 14.575471698113208, "percentage": 72.88, "elapsed_time": "0:47:23", "remaining_time": "0:17:38", "throughput": 5675.26, "total_tokens": 16139032} {"current_steps": 24725, "total_steps": 33920, "loss": 0.2686, "lr": 2.0767475983620317e-06, "epoch": 14.578419811320755, "percentage": 72.89, "elapsed_time": "0:47:24", "remaining_time": "0:17:37", "throughput": 5675.37, "total_tokens": 16142712} {"current_steps": 24730, "total_steps": 33920, "loss": 0.3082, "lr": 2.074660780322806e-06, "epoch": 14.581367924528301, "percentage": 72.91, "elapsed_time": "0:47:24", "remaining_time": "0:17:37", "throughput": 5675.55, "total_tokens": 16146616} {"current_steps": 24735, "total_steps": 33920, "loss": 0.3198, "lr": 2.0725747367797473e-06, "epoch": 14.58431603773585, "percentage": 72.92, "elapsed_time": "0:47:25", "remaining_time": "0:17:36", "throughput": 5675.54, "total_tokens": 16149560} {"current_steps": 24740, "total_steps": 33920, "loss": 0.3162, "lr": 2.070489468285143e-06, "epoch": 14.587264150943396, "percentage": 72.94, "elapsed_time": "0:47:26", "remaining_time": "0:17:36", "throughput": 5675.74, "total_tokens": 16153656} {"current_steps": 24745, "total_steps": 33920, "loss": 0.3303, "lr": 2.068404975391077e-06, "epoch": 14.590212264150944, "percentage": 72.95, "elapsed_time": "0:47:26", "remaining_time": "0:17:35", "throughput": 5675.83, "total_tokens": 16157464} {"current_steps": 24750, "total_steps": 33920, "loss": 0.372, "lr": 2.0663212586494293e-06, "epoch": 14.59316037735849, "percentage": 72.97, "elapsed_time": "0:47:27", "remaining_time": "0:17:34", "throughput": 5675.86, "total_tokens": 16160824} {"current_steps": 24755, "total_steps": 33920, "loss": 0.2608, "lr": 2.064238318611869e-06, "epoch": 14.596108490566039, "percentage": 72.98, "elapsed_time": "0:47:28", "remaining_time": "0:17:34", "throughput": 5675.98, "total_tokens": 16167384} {"current_steps": 24760, "total_steps": 33920, "loss": 0.2641, "lr": 2.0621561558298693e-06, "epoch": 14.599056603773585, "percentage": 73.0, "elapsed_time": "0:47:29", "remaining_time": "0:17:33", "throughput": 5676.09, "total_tokens": 16171224} {"current_steps": 24765, "total_steps": 33920, "loss": 0.293, "lr": 2.0600747708546877e-06, "epoch": 14.602004716981131, "percentage": 73.01, "elapsed_time": "0:47:29", "remaining_time": "0:17:33", "throughput": 5676.08, "total_tokens": 16174200} {"current_steps": 24770, "total_steps": 33920, "loss": 0.2646, "lr": 2.0579941642373814e-06, "epoch": 14.60495283018868, "percentage": 73.02, "elapsed_time": "0:47:30", "remaining_time": "0:17:32", "throughput": 5676.13, "total_tokens": 16177816} {"current_steps": 24775, "total_steps": 33920, "loss": 0.4378, "lr": 2.0559143365287993e-06, "epoch": 14.607900943396226, "percentage": 73.04, "elapsed_time": "0:47:30", "remaining_time": "0:17:32", "throughput": 5676.17, "total_tokens": 16180952} {"current_steps": 24780, "total_steps": 33920, "loss": 0.3841, "lr": 2.0538352882795846e-06, "epoch": 14.610849056603774, "percentage": 73.05, "elapsed_time": "0:47:31", "remaining_time": "0:17:31", "throughput": 5676.16, "total_tokens": 16184120} {"current_steps": 24785, "total_steps": 33920, "loss": 0.3101, "lr": 2.051757020040173e-06, "epoch": 14.61379716981132, "percentage": 73.07, "elapsed_time": "0:47:31", "remaining_time": "0:17:31", "throughput": 5676.13, "total_tokens": 16187000} {"current_steps": 24790, "total_steps": 33920, "loss": 0.3104, "lr": 2.0496795323607983e-06, "epoch": 14.616745283018869, "percentage": 73.08, "elapsed_time": "0:47:32", "remaining_time": "0:17:30", "throughput": 5676.1, "total_tokens": 16189720} {"current_steps": 24795, "total_steps": 33920, "loss": 0.2769, "lr": 2.0476028257914825e-06, "epoch": 14.619693396226415, "percentage": 73.1, "elapsed_time": "0:47:32", "remaining_time": "0:17:29", "throughput": 5676.18, "total_tokens": 16193112} {"current_steps": 24800, "total_steps": 33920, "loss": 0.516, "lr": 2.0455269008820433e-06, "epoch": 14.622641509433961, "percentage": 73.11, "elapsed_time": "0:47:33", "remaining_time": "0:17:29", "throughput": 5676.31, "total_tokens": 16197304} {"current_steps": 24805, "total_steps": 33920, "loss": 0.3636, "lr": 2.0434517581820893e-06, "epoch": 14.62558962264151, "percentage": 73.13, "elapsed_time": "0:47:34", "remaining_time": "0:17:28", "throughput": 5676.41, "total_tokens": 16200728} {"current_steps": 24810, "total_steps": 33920, "loss": 0.3165, "lr": 2.041377398241025e-06, "epoch": 14.628537735849056, "percentage": 73.14, "elapsed_time": "0:47:34", "remaining_time": "0:17:28", "throughput": 5676.32, "total_tokens": 16203448} {"current_steps": 24815, "total_steps": 33920, "loss": 0.3293, "lr": 2.0393038216080433e-06, "epoch": 14.631485849056604, "percentage": 73.16, "elapsed_time": "0:47:35", "remaining_time": "0:17:27", "throughput": 5676.35, "total_tokens": 16206584} {"current_steps": 24820, "total_steps": 33920, "loss": 0.5062, "lr": 2.037231028832135e-06, "epoch": 14.63443396226415, "percentage": 73.17, "elapsed_time": "0:47:35", "remaining_time": "0:17:26", "throughput": 5676.2, "total_tokens": 16208984} {"current_steps": 24825, "total_steps": 33920, "loss": 0.3864, "lr": 2.0351590204620823e-06, "epoch": 14.637382075471699, "percentage": 73.19, "elapsed_time": "0:47:36", "remaining_time": "0:17:26", "throughput": 5676.2, "total_tokens": 16211832} {"current_steps": 24830, "total_steps": 33920, "loss": 0.3588, "lr": 2.033087797046457e-06, "epoch": 14.640330188679245, "percentage": 73.2, "elapsed_time": "0:47:36", "remaining_time": "0:17:25", "throughput": 5676.29, "total_tokens": 16215160} {"current_steps": 24835, "total_steps": 33920, "loss": 0.4272, "lr": 2.031017359133624e-06, "epoch": 14.643278301886792, "percentage": 73.22, "elapsed_time": "0:47:37", "remaining_time": "0:17:25", "throughput": 5676.4, "total_tokens": 16218904} {"current_steps": 24840, "total_steps": 33920, "loss": 0.2499, "lr": 2.0289477072717406e-06, "epoch": 14.64622641509434, "percentage": 73.23, "elapsed_time": "0:47:37", "remaining_time": "0:17:24", "throughput": 5676.51, "total_tokens": 16222552} {"current_steps": 24845, "total_steps": 33920, "loss": 0.2778, "lr": 2.026878842008756e-06, "epoch": 14.649174528301886, "percentage": 73.25, "elapsed_time": "0:47:38", "remaining_time": "0:17:24", "throughput": 5676.5, "total_tokens": 16225496} {"current_steps": 24850, "total_steps": 33920, "loss": 0.3617, "lr": 2.0248107638924105e-06, "epoch": 14.652122641509434, "percentage": 73.26, "elapsed_time": "0:47:38", "remaining_time": "0:17:23", "throughput": 5676.51, "total_tokens": 16228728} {"current_steps": 24855, "total_steps": 33920, "loss": 0.3171, "lr": 2.0227434734702386e-06, "epoch": 14.65507075471698, "percentage": 73.28, "elapsed_time": "0:47:39", "remaining_time": "0:17:22", "throughput": 5676.59, "total_tokens": 16231960} {"current_steps": 24860, "total_steps": 33920, "loss": 0.3514, "lr": 2.020676971289563e-06, "epoch": 14.658018867924529, "percentage": 73.29, "elapsed_time": "0:47:40", "remaining_time": "0:17:22", "throughput": 5676.77, "total_tokens": 16236088} {"current_steps": 24865, "total_steps": 33920, "loss": 0.3923, "lr": 2.0186112578975005e-06, "epoch": 14.660966981132075, "percentage": 73.3, "elapsed_time": "0:47:40", "remaining_time": "0:17:21", "throughput": 5677.07, "total_tokens": 16241336} {"current_steps": 24870, "total_steps": 33920, "loss": 0.4374, "lr": 2.016546333840956e-06, "epoch": 14.663915094339622, "percentage": 73.32, "elapsed_time": "0:47:41", "remaining_time": "0:17:21", "throughput": 5677.03, "total_tokens": 16244088} {"current_steps": 24875, "total_steps": 33920, "loss": 0.3159, "lr": 2.014482199666627e-06, "epoch": 14.66686320754717, "percentage": 73.33, "elapsed_time": "0:47:41", "remaining_time": "0:17:20", "throughput": 5677.17, "total_tokens": 16247768} {"current_steps": 24880, "total_steps": 33920, "loss": 0.4157, "lr": 2.0124188559210017e-06, "epoch": 14.669811320754716, "percentage": 73.35, "elapsed_time": "0:47:42", "remaining_time": "0:17:20", "throughput": 5677.14, "total_tokens": 16250552} {"current_steps": 24885, "total_steps": 33920, "loss": 0.3023, "lr": 2.0103563031503613e-06, "epoch": 14.672759433962264, "percentage": 73.36, "elapsed_time": "0:47:42", "remaining_time": "0:17:19", "throughput": 5677.22, "total_tokens": 16253880} {"current_steps": 24890, "total_steps": 33920, "loss": 0.2616, "lr": 2.0082945419007745e-06, "epoch": 14.67570754716981, "percentage": 73.38, "elapsed_time": "0:47:43", "remaining_time": "0:17:18", "throughput": 5677.27, "total_tokens": 16256952} {"current_steps": 24895, "total_steps": 33920, "loss": 0.262, "lr": 2.0062335727181007e-06, "epoch": 14.678655660377359, "percentage": 73.39, "elapsed_time": "0:47:44", "remaining_time": "0:17:18", "throughput": 5677.47, "total_tokens": 16261112} {"current_steps": 24900, "total_steps": 33920, "loss": 0.2901, "lr": 2.004173396147992e-06, "epoch": 14.681603773584905, "percentage": 73.41, "elapsed_time": "0:47:44", "remaining_time": "0:17:17", "throughput": 5677.34, "total_tokens": 16263832} {"current_steps": 24905, "total_steps": 33920, "loss": 0.2831, "lr": 2.0021140127358873e-06, "epoch": 14.684551886792454, "percentage": 73.42, "elapsed_time": "0:47:45", "remaining_time": "0:17:17", "throughput": 5677.46, "total_tokens": 16267320} {"current_steps": 24910, "total_steps": 33920, "loss": 0.3113, "lr": 2.0000554230270164e-06, "epoch": 14.6875, "percentage": 73.44, "elapsed_time": "0:47:45", "remaining_time": "0:17:16", "throughput": 5677.44, "total_tokens": 16270296} {"current_steps": 24915, "total_steps": 33920, "loss": 0.2193, "lr": 1.997997627566401e-06, "epoch": 14.690448113207546, "percentage": 73.45, "elapsed_time": "0:47:46", "remaining_time": "0:17:15", "throughput": 5677.38, "total_tokens": 16273144} {"current_steps": 24920, "total_steps": 33920, "loss": 0.2916, "lr": 1.9959406268988536e-06, "epoch": 14.693396226415095, "percentage": 73.47, "elapsed_time": "0:47:46", "remaining_time": "0:17:15", "throughput": 5677.44, "total_tokens": 16276344} {"current_steps": 24925, "total_steps": 33920, "loss": 0.2714, "lr": 1.9938844215689717e-06, "epoch": 14.696344339622641, "percentage": 73.48, "elapsed_time": "0:47:47", "remaining_time": "0:17:14", "throughput": 5677.52, "total_tokens": 16279544} {"current_steps": 24930, "total_steps": 33920, "loss": 0.2246, "lr": 1.991829012121145e-06, "epoch": 14.69929245283019, "percentage": 73.5, "elapsed_time": "0:47:47", "remaining_time": "0:17:14", "throughput": 5677.62, "total_tokens": 16283128} {"current_steps": 24935, "total_steps": 33920, "loss": 0.3031, "lr": 1.989774399099552e-06, "epoch": 14.702240566037736, "percentage": 73.51, "elapsed_time": "0:47:48", "remaining_time": "0:17:13", "throughput": 5677.53, "total_tokens": 16285880} {"current_steps": 24940, "total_steps": 33920, "loss": 0.3746, "lr": 1.98772058304816e-06, "epoch": 14.705188679245284, "percentage": 73.53, "elapsed_time": "0:47:48", "remaining_time": "0:17:13", "throughput": 5677.45, "total_tokens": 16288472} {"current_steps": 24945, "total_steps": 33920, "loss": 0.4514, "lr": 1.9856675645107244e-06, "epoch": 14.70813679245283, "percentage": 73.54, "elapsed_time": "0:47:49", "remaining_time": "0:17:12", "throughput": 5677.41, "total_tokens": 16291256} {"current_steps": 24950, "total_steps": 33920, "loss": 0.2961, "lr": 1.9836153440307936e-06, "epoch": 14.711084905660378, "percentage": 73.56, "elapsed_time": "0:47:50", "remaining_time": "0:17:11", "throughput": 5677.52, "total_tokens": 16294872} {"current_steps": 24955, "total_steps": 33920, "loss": 0.269, "lr": 1.9815639221517002e-06, "epoch": 14.714033018867925, "percentage": 73.57, "elapsed_time": "0:47:50", "remaining_time": "0:17:11", "throughput": 5677.47, "total_tokens": 16297688} {"current_steps": 24960, "total_steps": 33920, "loss": 0.3559, "lr": 1.9795132994165673e-06, "epoch": 14.716981132075471, "percentage": 73.58, "elapsed_time": "0:47:51", "remaining_time": "0:17:10", "throughput": 5677.55, "total_tokens": 16301208} {"current_steps": 24965, "total_steps": 33920, "loss": 0.2998, "lr": 1.977463476368306e-06, "epoch": 14.71992924528302, "percentage": 73.6, "elapsed_time": "0:47:51", "remaining_time": "0:17:10", "throughput": 5677.46, "total_tokens": 16303736} {"current_steps": 24970, "total_steps": 33920, "loss": 0.2754, "lr": 1.975414453549614e-06, "epoch": 14.722877358490566, "percentage": 73.61, "elapsed_time": "0:47:52", "remaining_time": "0:17:09", "throughput": 5677.39, "total_tokens": 16306616} {"current_steps": 24975, "total_steps": 33920, "loss": 0.3963, "lr": 1.9733662315029826e-06, "epoch": 14.725825471698114, "percentage": 73.63, "elapsed_time": "0:47:52", "remaining_time": "0:17:08", "throughput": 5677.44, "total_tokens": 16310040} {"current_steps": 24980, "total_steps": 33920, "loss": 0.3532, "lr": 1.9713188107706856e-06, "epoch": 14.72877358490566, "percentage": 73.64, "elapsed_time": "0:47:53", "remaining_time": "0:17:08", "throughput": 5677.32, "total_tokens": 16312856} {"current_steps": 24985, "total_steps": 33920, "loss": 0.2758, "lr": 1.969272191894786e-06, "epoch": 14.731721698113208, "percentage": 73.66, "elapsed_time": "0:47:53", "remaining_time": "0:17:07", "throughput": 5677.26, "total_tokens": 16315640} {"current_steps": 24990, "total_steps": 33920, "loss": 0.297, "lr": 1.967226375417135e-06, "epoch": 14.734669811320755, "percentage": 73.67, "elapsed_time": "0:47:54", "remaining_time": "0:17:07", "throughput": 5677.3, "total_tokens": 16318680} {"current_steps": 24995, "total_steps": 33920, "loss": 0.3126, "lr": 1.965181361879372e-06, "epoch": 14.737617924528301, "percentage": 73.69, "elapsed_time": "0:47:54", "remaining_time": "0:17:06", "throughput": 5677.36, "total_tokens": 16321848} {"current_steps": 25000, "total_steps": 33920, "loss": 0.2886, "lr": 1.9631371518229214e-06, "epoch": 14.74056603773585, "percentage": 73.7, "elapsed_time": "0:47:55", "remaining_time": "0:17:05", "throughput": 5677.3, "total_tokens": 16324600} {"current_steps": 25005, "total_steps": 33920, "loss": 0.2822, "lr": 1.9610937457889975e-06, "epoch": 14.743514150943396, "percentage": 73.72, "elapsed_time": "0:47:55", "remaining_time": "0:17:05", "throughput": 5677.3, "total_tokens": 16327896} {"current_steps": 25010, "total_steps": 33920, "loss": 0.3042, "lr": 1.9590511443186032e-06, "epoch": 14.746462264150944, "percentage": 73.73, "elapsed_time": "0:47:56", "remaining_time": "0:17:04", "throughput": 5677.3, "total_tokens": 16331096} {"current_steps": 25015, "total_steps": 33920, "loss": 0.3561, "lr": 1.9570093479525243e-06, "epoch": 14.74941037735849, "percentage": 73.75, "elapsed_time": "0:47:57", "remaining_time": "0:17:04", "throughput": 5677.28, "total_tokens": 16333976} {"current_steps": 25020, "total_steps": 33920, "loss": 0.4548, "lr": 1.954968357231335e-06, "epoch": 14.752358490566039, "percentage": 73.76, "elapsed_time": "0:47:57", "remaining_time": "0:17:03", "throughput": 5677.27, "total_tokens": 16337176} {"current_steps": 25025, "total_steps": 33920, "loss": 0.3339, "lr": 1.9529281726953964e-06, "epoch": 14.755306603773585, "percentage": 73.78, "elapsed_time": "0:47:58", "remaining_time": "0:17:03", "throughput": 5677.32, "total_tokens": 16340312} {"current_steps": 25030, "total_steps": 33920, "loss": 0.3169, "lr": 1.9508887948848564e-06, "epoch": 14.758254716981131, "percentage": 73.79, "elapsed_time": "0:47:58", "remaining_time": "0:17:02", "throughput": 5677.45, "total_tokens": 16344728} {"current_steps": 25035, "total_steps": 33920, "loss": 0.2614, "lr": 1.9488502243396475e-06, "epoch": 14.76120283018868, "percentage": 73.81, "elapsed_time": "0:47:59", "remaining_time": "0:17:01", "throughput": 5677.53, "total_tokens": 16347832} {"current_steps": 25040, "total_steps": 33920, "loss": 0.2985, "lr": 1.946812461599492e-06, "epoch": 14.764150943396226, "percentage": 73.82, "elapsed_time": "0:47:59", "remaining_time": "0:17:01", "throughput": 5677.48, "total_tokens": 16350584} {"current_steps": 25045, "total_steps": 33920, "loss": 0.2169, "lr": 1.944775507203897e-06, "epoch": 14.767099056603774, "percentage": 73.84, "elapsed_time": "0:48:00", "remaining_time": "0:17:00", "throughput": 5677.55, "total_tokens": 16354104} {"current_steps": 25050, "total_steps": 33920, "loss": 0.2626, "lr": 1.942739361692153e-06, "epoch": 14.77004716981132, "percentage": 73.85, "elapsed_time": "0:48:00", "remaining_time": "0:17:00", "throughput": 5677.61, "total_tokens": 16357048} {"current_steps": 25055, "total_steps": 33920, "loss": 0.4593, "lr": 1.94070402560334e-06, "epoch": 14.772995283018869, "percentage": 73.86, "elapsed_time": "0:48:01", "remaining_time": "0:16:59", "throughput": 5677.84, "total_tokens": 16361048} {"current_steps": 25060, "total_steps": 33920, "loss": 0.2883, "lr": 1.93866949947632e-06, "epoch": 14.775943396226415, "percentage": 73.88, "elapsed_time": "0:48:02", "remaining_time": "0:16:58", "throughput": 5677.84, "total_tokens": 16363864} {"current_steps": 25065, "total_steps": 33920, "loss": 0.3646, "lr": 1.9366357838497423e-06, "epoch": 14.778891509433961, "percentage": 73.89, "elapsed_time": "0:48:02", "remaining_time": "0:16:58", "throughput": 5678.0, "total_tokens": 16367608} {"current_steps": 25070, "total_steps": 33920, "loss": 0.4128, "lr": 1.9346028792620454e-06, "epoch": 14.78183962264151, "percentage": 73.91, "elapsed_time": "0:48:03", "remaining_time": "0:16:57", "throughput": 5678.22, "total_tokens": 16371928} {"current_steps": 25075, "total_steps": 33920, "loss": 0.3401, "lr": 1.9325707862514464e-06, "epoch": 14.784787735849056, "percentage": 73.92, "elapsed_time": "0:48:03", "remaining_time": "0:16:57", "throughput": 5678.32, "total_tokens": 16375544} {"current_steps": 25080, "total_steps": 33920, "loss": 0.3298, "lr": 1.930539505355952e-06, "epoch": 14.787735849056604, "percentage": 73.94, "elapsed_time": "0:48:04", "remaining_time": "0:16:56", "throughput": 5678.35, "total_tokens": 16378648} {"current_steps": 25085, "total_steps": 33920, "loss": 0.4165, "lr": 1.9285090371133524e-06, "epoch": 14.79068396226415, "percentage": 73.95, "elapsed_time": "0:48:04", "remaining_time": "0:16:56", "throughput": 5678.45, "total_tokens": 16381880} {"current_steps": 25090, "total_steps": 33920, "loss": 0.4654, "lr": 1.9264793820612228e-06, "epoch": 14.793632075471699, "percentage": 73.97, "elapsed_time": "0:48:05", "remaining_time": "0:16:55", "throughput": 5678.61, "total_tokens": 16386296} {"current_steps": 25095, "total_steps": 33920, "loss": 0.2619, "lr": 1.924450540736921e-06, "epoch": 14.796580188679245, "percentage": 73.98, "elapsed_time": "0:48:06", "remaining_time": "0:16:54", "throughput": 5678.58, "total_tokens": 16389272} {"current_steps": 25100, "total_steps": 33920, "loss": 0.3192, "lr": 1.922422513677593e-06, "epoch": 14.799528301886792, "percentage": 74.0, "elapsed_time": "0:48:06", "remaining_time": "0:16:54", "throughput": 5678.66, "total_tokens": 16392664} {"current_steps": 25105, "total_steps": 33920, "loss": 0.4344, "lr": 1.9203953014201703e-06, "epoch": 14.80247641509434, "percentage": 74.01, "elapsed_time": "0:48:07", "remaining_time": "0:16:53", "throughput": 5678.81, "total_tokens": 16396536} {"current_steps": 25110, "total_steps": 33920, "loss": 0.2464, "lr": 1.918368904501364e-06, "epoch": 14.805424528301886, "percentage": 74.03, "elapsed_time": "0:48:07", "remaining_time": "0:16:53", "throughput": 5679.08, "total_tokens": 16400952} {"current_steps": 25115, "total_steps": 33920, "loss": 0.4455, "lr": 1.9163433234576713e-06, "epoch": 14.808372641509434, "percentage": 74.04, "elapsed_time": "0:48:08", "remaining_time": "0:16:52", "throughput": 5679.05, "total_tokens": 16403864} {"current_steps": 25120, "total_steps": 33920, "loss": 0.3224, "lr": 1.9143185588253733e-06, "epoch": 14.81132075471698, "percentage": 74.06, "elapsed_time": "0:48:08", "remaining_time": "0:16:52", "throughput": 5679.01, "total_tokens": 16406648} {"current_steps": 25125, "total_steps": 33920, "loss": 0.3417, "lr": 1.9122946111405354e-06, "epoch": 14.814268867924529, "percentage": 74.07, "elapsed_time": "0:48:09", "remaining_time": "0:16:51", "throughput": 5678.94, "total_tokens": 16409368} {"current_steps": 25130, "total_steps": 33920, "loss": 0.2512, "lr": 1.910271480939005e-06, "epoch": 14.817216981132075, "percentage": 74.09, "elapsed_time": "0:48:10", "remaining_time": "0:16:50", "throughput": 5678.79, "total_tokens": 16411832} {"current_steps": 25135, "total_steps": 33920, "loss": 0.2818, "lr": 1.9082491687564176e-06, "epoch": 14.820165094339622, "percentage": 74.1, "elapsed_time": "0:48:10", "remaining_time": "0:16:50", "throughput": 5679.02, "total_tokens": 16416504} {"current_steps": 25140, "total_steps": 33920, "loss": 0.3733, "lr": 1.9062276751281872e-06, "epoch": 14.82311320754717, "percentage": 74.12, "elapsed_time": "0:48:11", "remaining_time": "0:16:49", "throughput": 5678.88, "total_tokens": 16419000} {"current_steps": 25145, "total_steps": 33920, "loss": 0.4264, "lr": 1.9042070005895136e-06, "epoch": 14.826061320754716, "percentage": 74.13, "elapsed_time": "0:48:11", "remaining_time": "0:16:49", "throughput": 5679.08, "total_tokens": 16423064} {"current_steps": 25150, "total_steps": 33920, "loss": 0.2879, "lr": 1.9021871456753788e-06, "epoch": 14.829009433962264, "percentage": 74.15, "elapsed_time": "0:48:12", "remaining_time": "0:16:48", "throughput": 5679.12, "total_tokens": 16426200} {"current_steps": 25155, "total_steps": 33920, "loss": 0.2652, "lr": 1.9001681109205478e-06, "epoch": 14.83195754716981, "percentage": 74.16, "elapsed_time": "0:48:12", "remaining_time": "0:16:47", "throughput": 5679.1, "total_tokens": 16429048} {"current_steps": 25160, "total_steps": 33920, "loss": 0.426, "lr": 1.898149896859567e-06, "epoch": 14.834905660377359, "percentage": 74.17, "elapsed_time": "0:48:13", "remaining_time": "0:16:47", "throughput": 5678.98, "total_tokens": 16431768} {"current_steps": 25165, "total_steps": 33920, "loss": 0.2506, "lr": 1.8961325040267714e-06, "epoch": 14.837853773584905, "percentage": 74.19, "elapsed_time": "0:48:13", "remaining_time": "0:16:46", "throughput": 5679.02, "total_tokens": 16434904} {"current_steps": 25170, "total_steps": 33920, "loss": 0.2935, "lr": 1.894115932956272e-06, "epoch": 14.840801886792454, "percentage": 74.2, "elapsed_time": "0:48:14", "remaining_time": "0:16:46", "throughput": 5679.03, "total_tokens": 16437912} {"current_steps": 25175, "total_steps": 33920, "loss": 0.3062, "lr": 1.8921001841819652e-06, "epoch": 14.84375, "percentage": 74.22, "elapsed_time": "0:48:15", "remaining_time": "0:16:45", "throughput": 5679.09, "total_tokens": 16441208} {"current_steps": 25180, "total_steps": 33920, "loss": 0.3655, "lr": 1.8900852582375284e-06, "epoch": 14.846698113207546, "percentage": 74.23, "elapsed_time": "0:48:15", "remaining_time": "0:16:45", "throughput": 5679.12, "total_tokens": 16444568} {"current_steps": 25185, "total_steps": 33920, "loss": 0.2747, "lr": 1.8880711556564214e-06, "epoch": 14.849646226415095, "percentage": 74.25, "elapsed_time": "0:48:16", "remaining_time": "0:16:44", "throughput": 5679.23, "total_tokens": 16448216} {"current_steps": 25190, "total_steps": 33920, "loss": 0.3763, "lr": 1.8860578769718891e-06, "epoch": 14.852594339622641, "percentage": 74.26, "elapsed_time": "0:48:16", "remaining_time": "0:16:43", "throughput": 5679.16, "total_tokens": 16450712} {"current_steps": 25195, "total_steps": 33920, "loss": 0.398, "lr": 1.8840454227169525e-06, "epoch": 14.85554245283019, "percentage": 74.28, "elapsed_time": "0:48:17", "remaining_time": "0:16:43", "throughput": 5679.16, "total_tokens": 16453880} {"current_steps": 25200, "total_steps": 33920, "loss": 0.3009, "lr": 1.882033793424421e-06, "epoch": 14.858490566037736, "percentage": 74.29, "elapsed_time": "0:48:17", "remaining_time": "0:16:42", "throughput": 5679.21, "total_tokens": 16456856} {"current_steps": 25205, "total_steps": 33920, "loss": 0.2878, "lr": 1.88002298962688e-06, "epoch": 14.861438679245284, "percentage": 74.31, "elapsed_time": "0:48:18", "remaining_time": "0:16:42", "throughput": 5679.21, "total_tokens": 16459704} {"current_steps": 25210, "total_steps": 33920, "loss": 0.3166, "lr": 1.8780130118566996e-06, "epoch": 14.86438679245283, "percentage": 74.32, "elapsed_time": "0:48:18", "remaining_time": "0:16:41", "throughput": 5679.2, "total_tokens": 16462680} {"current_steps": 25215, "total_steps": 33920, "loss": 0.2231, "lr": 1.876003860646029e-06, "epoch": 14.867334905660378, "percentage": 74.34, "elapsed_time": "0:48:19", "remaining_time": "0:16:40", "throughput": 5679.08, "total_tokens": 16465528} {"current_steps": 25220, "total_steps": 33920, "loss": 0.319, "lr": 1.8739955365267997e-06, "epoch": 14.870283018867925, "percentage": 74.35, "elapsed_time": "0:48:19", "remaining_time": "0:16:40", "throughput": 5679.1, "total_tokens": 16468280} {"current_steps": 25225, "total_steps": 33920, "loss": 0.3685, "lr": 1.8719880400307228e-06, "epoch": 14.873231132075471, "percentage": 74.37, "elapsed_time": "0:48:20", "remaining_time": "0:16:39", "throughput": 5679.21, "total_tokens": 16471864} {"current_steps": 25230, "total_steps": 33920, "loss": 0.336, "lr": 1.869981371689295e-06, "epoch": 14.87617924528302, "percentage": 74.38, "elapsed_time": "0:48:21", "remaining_time": "0:16:39", "throughput": 5679.42, "total_tokens": 16475992} {"current_steps": 25235, "total_steps": 33920, "loss": 0.3583, "lr": 1.867975532033789e-06, "epoch": 14.879127358490566, "percentage": 74.4, "elapsed_time": "0:48:21", "remaining_time": "0:16:38", "throughput": 5679.61, "total_tokens": 16480120} {"current_steps": 25240, "total_steps": 33920, "loss": 0.301, "lr": 1.8659705215952589e-06, "epoch": 14.882075471698114, "percentage": 74.41, "elapsed_time": "0:48:22", "remaining_time": "0:16:38", "throughput": 5679.71, "total_tokens": 16483512} {"current_steps": 25245, "total_steps": 33920, "loss": 0.3772, "lr": 1.8639663409045405e-06, "epoch": 14.88502358490566, "percentage": 74.43, "elapsed_time": "0:48:22", "remaining_time": "0:16:37", "throughput": 5679.66, "total_tokens": 16486296} {"current_steps": 25250, "total_steps": 33920, "loss": 0.3067, "lr": 1.8619629904922466e-06, "epoch": 14.887971698113208, "percentage": 74.44, "elapsed_time": "0:48:23", "remaining_time": "0:16:36", "throughput": 5679.82, "total_tokens": 16490008} {"current_steps": 25255, "total_steps": 33920, "loss": 0.3912, "lr": 1.859960470888777e-06, "epoch": 14.890919811320755, "percentage": 74.45, "elapsed_time": "0:48:23", "remaining_time": "0:16:36", "throughput": 5679.79, "total_tokens": 16493112} {"current_steps": 25260, "total_steps": 33920, "loss": 0.5101, "lr": 1.857958782624306e-06, "epoch": 14.893867924528301, "percentage": 74.47, "elapsed_time": "0:48:24", "remaining_time": "0:16:35", "throughput": 5679.73, "total_tokens": 16495640} {"current_steps": 25265, "total_steps": 33920, "loss": 0.4065, "lr": 1.8559579262287886e-06, "epoch": 14.89681603773585, "percentage": 74.48, "elapsed_time": "0:48:24", "remaining_time": "0:16:35", "throughput": 5679.64, "total_tokens": 16498040} {"current_steps": 25270, "total_steps": 33920, "loss": 0.2834, "lr": 1.8539579022319599e-06, "epoch": 14.899764150943396, "percentage": 74.5, "elapsed_time": "0:48:25", "remaining_time": "0:16:34", "throughput": 5679.69, "total_tokens": 16501240} {"current_steps": 25275, "total_steps": 33920, "loss": 0.3418, "lr": 1.8519587111633357e-06, "epoch": 14.902712264150944, "percentage": 74.51, "elapsed_time": "0:48:25", "remaining_time": "0:16:33", "throughput": 5679.63, "total_tokens": 16503896} {"current_steps": 25280, "total_steps": 33920, "loss": 0.3834, "lr": 1.8499603535522082e-06, "epoch": 14.90566037735849, "percentage": 74.53, "elapsed_time": "0:48:26", "remaining_time": "0:16:33", "throughput": 5679.52, "total_tokens": 16506296} {"current_steps": 25285, "total_steps": 33920, "loss": 0.2442, "lr": 1.8479628299276543e-06, "epoch": 14.908608490566039, "percentage": 74.54, "elapsed_time": "0:48:26", "remaining_time": "0:16:32", "throughput": 5679.51, "total_tokens": 16509336} {"current_steps": 25290, "total_steps": 33920, "loss": 0.2495, "lr": 1.8459661408185241e-06, "epoch": 14.911556603773585, "percentage": 74.56, "elapsed_time": "0:48:27", "remaining_time": "0:16:32", "throughput": 5679.62, "total_tokens": 16512920} {"current_steps": 25295, "total_steps": 33920, "loss": 0.2916, "lr": 1.8439702867534536e-06, "epoch": 14.914504716981131, "percentage": 74.57, "elapsed_time": "0:48:27", "remaining_time": "0:16:31", "throughput": 5679.56, "total_tokens": 16515704} {"current_steps": 25300, "total_steps": 33920, "loss": 0.2867, "lr": 1.841975268260851e-06, "epoch": 14.91745283018868, "percentage": 74.59, "elapsed_time": "0:48:28", "remaining_time": "0:16:30", "throughput": 5679.56, "total_tokens": 16518360} {"current_steps": 25305, "total_steps": 33920, "loss": 0.4697, "lr": 1.8399810858689066e-06, "epoch": 14.920400943396226, "percentage": 74.6, "elapsed_time": "0:48:28", "remaining_time": "0:16:30", "throughput": 5679.38, "total_tokens": 16520888} {"current_steps": 25310, "total_steps": 33920, "loss": 0.278, "lr": 1.8379877401055884e-06, "epoch": 14.923349056603774, "percentage": 74.62, "elapsed_time": "0:48:29", "remaining_time": "0:16:29", "throughput": 5679.21, "total_tokens": 16523480} {"current_steps": 25315, "total_steps": 33920, "loss": 0.4943, "lr": 1.8359952314986418e-06, "epoch": 14.92629716981132, "percentage": 74.63, "elapsed_time": "0:48:29", "remaining_time": "0:16:29", "throughput": 5679.32, "total_tokens": 16526648} {"current_steps": 25320, "total_steps": 33920, "loss": 0.2614, "lr": 1.8340035605755957e-06, "epoch": 14.929245283018869, "percentage": 74.65, "elapsed_time": "0:48:30", "remaining_time": "0:16:28", "throughput": 5679.35, "total_tokens": 16529688} {"current_steps": 25325, "total_steps": 33920, "loss": 0.3373, "lr": 1.8320127278637518e-06, "epoch": 14.932193396226415, "percentage": 74.66, "elapsed_time": "0:48:31", "remaining_time": "0:16:27", "throughput": 5679.35, "total_tokens": 16533240} {"current_steps": 25330, "total_steps": 33920, "loss": 0.4166, "lr": 1.830022733890191e-06, "epoch": 14.935141509433961, "percentage": 74.68, "elapsed_time": "0:48:31", "remaining_time": "0:16:27", "throughput": 5679.39, "total_tokens": 16536344} {"current_steps": 25335, "total_steps": 33920, "loss": 0.2424, "lr": 1.8280335791817733e-06, "epoch": 14.93808962264151, "percentage": 74.69, "elapsed_time": "0:48:32", "remaining_time": "0:16:26", "throughput": 5679.34, "total_tokens": 16539224} {"current_steps": 25340, "total_steps": 33920, "loss": 0.2813, "lr": 1.826045264265136e-06, "epoch": 14.941037735849056, "percentage": 74.71, "elapsed_time": "0:48:32", "remaining_time": "0:16:26", "throughput": 5679.53, "total_tokens": 16543224} {"current_steps": 25345, "total_steps": 33920, "loss": 0.3727, "lr": 1.8240577896666928e-06, "epoch": 14.943985849056604, "percentage": 74.72, "elapsed_time": "0:48:33", "remaining_time": "0:16:25", "throughput": 5679.59, "total_tokens": 16546744} {"current_steps": 25350, "total_steps": 33920, "loss": 0.3105, "lr": 1.8220711559126382e-06, "epoch": 14.94693396226415, "percentage": 74.73, "elapsed_time": "0:48:33", "remaining_time": "0:16:25", "throughput": 5679.56, "total_tokens": 16549336} {"current_steps": 25355, "total_steps": 33920, "loss": 0.2301, "lr": 1.8200853635289417e-06, "epoch": 14.949882075471699, "percentage": 74.75, "elapsed_time": "0:48:34", "remaining_time": "0:16:24", "throughput": 5679.53, "total_tokens": 16552248} {"current_steps": 25360, "total_steps": 33920, "loss": 0.2863, "lr": 1.81810041304135e-06, "epoch": 14.952830188679245, "percentage": 74.76, "elapsed_time": "0:48:34", "remaining_time": "0:16:23", "throughput": 5679.64, "total_tokens": 16555800} {"current_steps": 25365, "total_steps": 33920, "loss": 0.3241, "lr": 1.8161163049753865e-06, "epoch": 14.955778301886792, "percentage": 74.78, "elapsed_time": "0:48:35", "remaining_time": "0:16:23", "throughput": 5679.57, "total_tokens": 16558904} {"current_steps": 25370, "total_steps": 33920, "loss": 0.3297, "lr": 1.8141330398563533e-06, "epoch": 14.95872641509434, "percentage": 74.79, "elapsed_time": "0:48:36", "remaining_time": "0:16:22", "throughput": 5679.53, "total_tokens": 16561880} {"current_steps": 25375, "total_steps": 33920, "loss": 0.3352, "lr": 1.8121506182093268e-06, "epoch": 14.961674528301886, "percentage": 74.81, "elapsed_time": "0:48:36", "remaining_time": "0:16:22", "throughput": 5679.64, "total_tokens": 16565176} {"current_steps": 25380, "total_steps": 33920, "loss": 0.3685, "lr": 1.8101690405591643e-06, "epoch": 14.964622641509434, "percentage": 74.82, "elapsed_time": "0:48:37", "remaining_time": "0:16:21", "throughput": 5679.6, "total_tokens": 16567864} {"current_steps": 25385, "total_steps": 33920, "loss": 0.2538, "lr": 1.8081883074304945e-06, "epoch": 14.96757075471698, "percentage": 74.84, "elapsed_time": "0:48:37", "remaining_time": "0:16:20", "throughput": 5679.64, "total_tokens": 16571256} {"current_steps": 25390, "total_steps": 33920, "loss": 0.2816, "lr": 1.8062084193477275e-06, "epoch": 14.970518867924529, "percentage": 74.85, "elapsed_time": "0:48:38", "remaining_time": "0:16:20", "throughput": 5679.71, "total_tokens": 16575224} {"current_steps": 25395, "total_steps": 33920, "loss": 0.2987, "lr": 1.804229376835046e-06, "epoch": 14.973466981132075, "percentage": 74.87, "elapsed_time": "0:48:39", "remaining_time": "0:16:19", "throughput": 5679.77, "total_tokens": 16580056} {"current_steps": 25400, "total_steps": 33920, "loss": 0.3798, "lr": 1.8022511804164105e-06, "epoch": 14.976415094339622, "percentage": 74.88, "elapsed_time": "0:48:39", "remaining_time": "0:16:19", "throughput": 5679.74, "total_tokens": 16583448} {"current_steps": 25405, "total_steps": 33920, "loss": 0.3536, "lr": 1.8002738306155559e-06, "epoch": 14.97936320754717, "percentage": 74.9, "elapsed_time": "0:48:40", "remaining_time": "0:16:18", "throughput": 5679.74, "total_tokens": 16586488} {"current_steps": 25410, "total_steps": 33920, "loss": 0.2914, "lr": 1.7982973279559935e-06, "epoch": 14.982311320754716, "percentage": 74.91, "elapsed_time": "0:48:40", "remaining_time": "0:16:18", "throughput": 5679.63, "total_tokens": 16589272} {"current_steps": 25415, "total_steps": 33920, "loss": 0.2614, "lr": 1.7963216729610134e-06, "epoch": 14.985259433962264, "percentage": 74.93, "elapsed_time": "0:48:41", "remaining_time": "0:16:17", "throughput": 5679.76, "total_tokens": 16593368} {"current_steps": 25420, "total_steps": 33920, "loss": 0.2487, "lr": 1.7943468661536773e-06, "epoch": 14.98820754716981, "percentage": 74.94, "elapsed_time": "0:48:41", "remaining_time": "0:16:17", "throughput": 5679.7, "total_tokens": 16596056} {"current_steps": 25425, "total_steps": 33920, "loss": 0.4671, "lr": 1.7923729080568242e-06, "epoch": 14.991155660377359, "percentage": 74.96, "elapsed_time": "0:48:42", "remaining_time": "0:16:16", "throughput": 5679.8, "total_tokens": 16599192} {"current_steps": 25430, "total_steps": 33920, "loss": 0.3711, "lr": 1.7903997991930683e-06, "epoch": 14.994103773584905, "percentage": 74.97, "elapsed_time": "0:48:43", "remaining_time": "0:16:15", "throughput": 5679.84, "total_tokens": 16602360} {"current_steps": 25435, "total_steps": 33920, "loss": 0.2845, "lr": 1.7884275400847972e-06, "epoch": 14.997051886792454, "percentage": 74.99, "elapsed_time": "0:48:43", "remaining_time": "0:16:15", "throughput": 5679.95, "total_tokens": 16605816} {"current_steps": 25440, "total_steps": 33920, "loss": 0.2957, "lr": 1.786456131254175e-06, "epoch": 15.0, "percentage": 75.0, "elapsed_time": "0:48:44", "remaining_time": "0:16:14", "throughput": 5679.56, "total_tokens": 16608128} {"current_steps": 25445, "total_steps": 33920, "loss": 0.3144, "lr": 1.784485573223143e-06, "epoch": 15.002948113207546, "percentage": 75.01, "elapsed_time": "0:48:44", "remaining_time": "0:16:14", "throughput": 5679.19, "total_tokens": 16611392} {"current_steps": 25450, "total_steps": 33920, "loss": 0.3029, "lr": 1.782515866513414e-06, "epoch": 15.005896226415095, "percentage": 75.03, "elapsed_time": "0:48:45", "remaining_time": "0:16:13", "throughput": 5679.32, "total_tokens": 16614944} {"current_steps": 25455, "total_steps": 33920, "loss": 0.2815, "lr": 1.7805470116464758e-06, "epoch": 15.008844339622641, "percentage": 75.04, "elapsed_time": "0:48:46", "remaining_time": "0:16:13", "throughput": 5679.45, "total_tokens": 16618240} {"current_steps": 25460, "total_steps": 33920, "loss": 0.29, "lr": 1.7785790091435911e-06, "epoch": 15.01179245283019, "percentage": 75.06, "elapsed_time": "0:48:46", "remaining_time": "0:16:12", "throughput": 5679.39, "total_tokens": 16620832} {"current_steps": 25465, "total_steps": 33920, "loss": 0.3699, "lr": 1.776611859525796e-06, "epoch": 15.014740566037736, "percentage": 75.07, "elapsed_time": "0:48:47", "remaining_time": "0:16:11", "throughput": 5679.34, "total_tokens": 16623616} {"current_steps": 25470, "total_steps": 33920, "loss": 0.3083, "lr": 1.7746455633139042e-06, "epoch": 15.017688679245284, "percentage": 75.09, "elapsed_time": "0:48:47", "remaining_time": "0:16:11", "throughput": 5679.39, "total_tokens": 16626560} {"current_steps": 25475, "total_steps": 33920, "loss": 0.4059, "lr": 1.7726801210285005e-06, "epoch": 15.02063679245283, "percentage": 75.1, "elapsed_time": "0:48:48", "remaining_time": "0:16:10", "throughput": 5679.41, "total_tokens": 16629632} {"current_steps": 25480, "total_steps": 33920, "loss": 0.3657, "lr": 1.7707155331899418e-06, "epoch": 15.023584905660377, "percentage": 75.12, "elapsed_time": "0:48:48", "remaining_time": "0:16:10", "throughput": 5679.49, "total_tokens": 16632576} {"current_steps": 25485, "total_steps": 33920, "loss": 0.2627, "lr": 1.7687518003183645e-06, "epoch": 15.026533018867925, "percentage": 75.13, "elapsed_time": "0:48:49", "remaining_time": "0:16:09", "throughput": 5679.76, "total_tokens": 16637632} {"current_steps": 25490, "total_steps": 33920, "loss": 0.2495, "lr": 1.766788922933675e-06, "epoch": 15.029481132075471, "percentage": 75.15, "elapsed_time": "0:48:49", "remaining_time": "0:16:08", "throughput": 5679.7, "total_tokens": 16640192} {"current_steps": 25495, "total_steps": 33920, "loss": 0.3387, "lr": 1.7648269015555514e-06, "epoch": 15.03242924528302, "percentage": 75.16, "elapsed_time": "0:48:50", "remaining_time": "0:16:08", "throughput": 5679.72, "total_tokens": 16643200} {"current_steps": 25500, "total_steps": 33920, "loss": 0.2781, "lr": 1.7628657367034474e-06, "epoch": 15.035377358490566, "percentage": 75.18, "elapsed_time": "0:48:50", "remaining_time": "0:16:07", "throughput": 5679.98, "total_tokens": 16647584} {"current_steps": 25505, "total_steps": 33920, "loss": 0.3434, "lr": 1.7609054288965922e-06, "epoch": 15.038325471698114, "percentage": 75.19, "elapsed_time": "0:48:51", "remaining_time": "0:16:07", "throughput": 5680.01, "total_tokens": 16650592} {"current_steps": 25510, "total_steps": 33920, "loss": 0.2704, "lr": 1.7589459786539847e-06, "epoch": 15.04127358490566, "percentage": 75.21, "elapsed_time": "0:48:51", "remaining_time": "0:16:06", "throughput": 5680.1, "total_tokens": 16653824} {"current_steps": 25515, "total_steps": 33920, "loss": 0.3218, "lr": 1.7569873864943975e-06, "epoch": 15.044221698113208, "percentage": 75.22, "elapsed_time": "0:48:52", "remaining_time": "0:16:06", "throughput": 5680.38, "total_tokens": 16658624} {"current_steps": 25520, "total_steps": 33920, "loss": 0.2467, "lr": 1.7550296529363764e-06, "epoch": 15.047169811320755, "percentage": 75.24, "elapsed_time": "0:48:53", "remaining_time": "0:16:05", "throughput": 5680.49, "total_tokens": 16662144} {"current_steps": 25525, "total_steps": 33920, "loss": 0.3154, "lr": 1.7530727784982393e-06, "epoch": 15.050117924528301, "percentage": 75.25, "elapsed_time": "0:48:53", "remaining_time": "0:16:04", "throughput": 5680.72, "total_tokens": 16666208} {"current_steps": 25530, "total_steps": 33920, "loss": 0.2863, "lr": 1.7511167636980765e-06, "epoch": 15.05306603773585, "percentage": 75.27, "elapsed_time": "0:48:54", "remaining_time": "0:16:04", "throughput": 5680.83, "total_tokens": 16669728} {"current_steps": 25535, "total_steps": 33920, "loss": 0.2888, "lr": 1.7491616090537539e-06, "epoch": 15.056014150943396, "percentage": 75.28, "elapsed_time": "0:48:54", "remaining_time": "0:16:03", "throughput": 5680.94, "total_tokens": 16673120} {"current_steps": 25540, "total_steps": 33920, "loss": 0.3318, "lr": 1.7472073150829056e-06, "epoch": 15.058962264150944, "percentage": 75.29, "elapsed_time": "0:48:55", "remaining_time": "0:16:03", "throughput": 5681.11, "total_tokens": 16678144} {"current_steps": 25545, "total_steps": 33920, "loss": 0.3733, "lr": 1.745253882302939e-06, "epoch": 15.06191037735849, "percentage": 75.31, "elapsed_time": "0:48:56", "remaining_time": "0:16:02", "throughput": 5681.14, "total_tokens": 16681312} {"current_steps": 25550, "total_steps": 33920, "loss": 0.305, "lr": 1.743301311231035e-06, "epoch": 15.064858490566039, "percentage": 75.32, "elapsed_time": "0:48:56", "remaining_time": "0:16:02", "throughput": 5681.23, "total_tokens": 16685216} {"current_steps": 25555, "total_steps": 33920, "loss": 0.2366, "lr": 1.7413496023841437e-06, "epoch": 15.067806603773585, "percentage": 75.34, "elapsed_time": "0:48:57", "remaining_time": "0:16:01", "throughput": 5681.31, "total_tokens": 16688736} {"current_steps": 25560, "total_steps": 33920, "loss": 0.2316, "lr": 1.7393987562789876e-06, "epoch": 15.070754716981131, "percentage": 75.35, "elapsed_time": "0:48:58", "remaining_time": "0:16:00", "throughput": 5681.33, "total_tokens": 16692000} {"current_steps": 25565, "total_steps": 33920, "loss": 0.3287, "lr": 1.7374487734320655e-06, "epoch": 15.07370283018868, "percentage": 75.37, "elapsed_time": "0:48:58", "remaining_time": "0:16:00", "throughput": 5681.28, "total_tokens": 16694912} {"current_steps": 25570, "total_steps": 33920, "loss": 0.2694, "lr": 1.7354996543596408e-06, "epoch": 15.076650943396226, "percentage": 75.38, "elapsed_time": "0:48:59", "remaining_time": "0:15:59", "throughput": 5681.33, "total_tokens": 16698016} {"current_steps": 25575, "total_steps": 33920, "loss": 0.2626, "lr": 1.7335513995777504e-06, "epoch": 15.079599056603774, "percentage": 75.4, "elapsed_time": "0:48:59", "remaining_time": "0:15:59", "throughput": 5681.29, "total_tokens": 16701088} {"current_steps": 25580, "total_steps": 33920, "loss": 0.364, "lr": 1.7316040096022062e-06, "epoch": 15.08254716981132, "percentage": 75.41, "elapsed_time": "0:49:00", "remaining_time": "0:15:58", "throughput": 5681.15, "total_tokens": 16703552} {"current_steps": 25585, "total_steps": 33920, "loss": 0.284, "lr": 1.7296574849485863e-06, "epoch": 15.085495283018869, "percentage": 75.43, "elapsed_time": "0:49:00", "remaining_time": "0:15:58", "throughput": 5681.22, "total_tokens": 16706848} {"current_steps": 25590, "total_steps": 33920, "loss": 0.2834, "lr": 1.7277118261322423e-06, "epoch": 15.088443396226415, "percentage": 75.44, "elapsed_time": "0:49:01", "remaining_time": "0:15:57", "throughput": 5681.17, "total_tokens": 16709664} {"current_steps": 25595, "total_steps": 33920, "loss": 0.2542, "lr": 1.7257670336682925e-06, "epoch": 15.091391509433961, "percentage": 75.46, "elapsed_time": "0:49:01", "remaining_time": "0:15:56", "throughput": 5681.19, "total_tokens": 16712896} {"current_steps": 25600, "total_steps": 33920, "loss": 0.4803, "lr": 1.7238231080716339e-06, "epoch": 15.09433962264151, "percentage": 75.47, "elapsed_time": "0:49:02", "remaining_time": "0:15:56", "throughput": 5681.08, "total_tokens": 16715680} {"current_steps": 25605, "total_steps": 33920, "loss": 0.3053, "lr": 1.721880049856927e-06, "epoch": 15.097287735849056, "percentage": 75.49, "elapsed_time": "0:49:02", "remaining_time": "0:15:55", "throughput": 5681.02, "total_tokens": 16718848} {"current_steps": 25610, "total_steps": 33920, "loss": 0.2962, "lr": 1.7199378595386046e-06, "epoch": 15.100235849056604, "percentage": 75.5, "elapsed_time": "0:49:03", "remaining_time": "0:15:55", "throughput": 5680.96, "total_tokens": 16721600} {"current_steps": 25615, "total_steps": 33920, "loss": 0.2975, "lr": 1.7179965376308705e-06, "epoch": 15.10318396226415, "percentage": 75.52, "elapsed_time": "0:49:03", "remaining_time": "0:15:54", "throughput": 5680.8, "total_tokens": 16724224} {"current_steps": 25620, "total_steps": 33920, "loss": 0.2512, "lr": 1.7160560846476976e-06, "epoch": 15.106132075471699, "percentage": 75.53, "elapsed_time": "0:49:04", "remaining_time": "0:15:53", "throughput": 5680.9, "total_tokens": 16728096} {"current_steps": 25625, "total_steps": 33920, "loss": 0.2439, "lr": 1.7141165011028277e-06, "epoch": 15.109080188679245, "percentage": 75.55, "elapsed_time": "0:49:05", "remaining_time": "0:15:53", "throughput": 5680.96, "total_tokens": 16731168} {"current_steps": 25630, "total_steps": 33920, "loss": 0.2955, "lr": 1.7121777875097767e-06, "epoch": 15.112028301886792, "percentage": 75.56, "elapsed_time": "0:49:05", "remaining_time": "0:15:52", "throughput": 5681.08, "total_tokens": 16734720} {"current_steps": 25635, "total_steps": 33920, "loss": 0.2936, "lr": 1.7102399443818268e-06, "epoch": 15.11497641509434, "percentage": 75.57, "elapsed_time": "0:49:06", "remaining_time": "0:15:52", "throughput": 5681.2, "total_tokens": 16738496} {"current_steps": 25640, "total_steps": 33920, "loss": 0.4011, "lr": 1.7083029722320294e-06, "epoch": 15.117924528301886, "percentage": 75.59, "elapsed_time": "0:49:06", "remaining_time": "0:15:51", "throughput": 5681.42, "total_tokens": 16742848} {"current_steps": 25645, "total_steps": 33920, "loss": 0.3005, "lr": 1.7063668715732063e-06, "epoch": 15.120872641509434, "percentage": 75.6, "elapsed_time": "0:49:07", "remaining_time": "0:15:51", "throughput": 5681.5, "total_tokens": 16746240} {"current_steps": 25650, "total_steps": 33920, "loss": 0.3792, "lr": 1.7044316429179492e-06, "epoch": 15.12382075471698, "percentage": 75.62, "elapsed_time": "0:49:08", "remaining_time": "0:15:50", "throughput": 5681.7, "total_tokens": 16750528} {"current_steps": 25655, "total_steps": 33920, "loss": 0.2816, "lr": 1.7024972867786155e-06, "epoch": 15.126768867924529, "percentage": 75.63, "elapsed_time": "0:49:08", "remaining_time": "0:15:50", "throughput": 5682.03, "total_tokens": 16755680} {"current_steps": 25660, "total_steps": 33920, "loss": 0.2923, "lr": 1.7005638036673389e-06, "epoch": 15.129716981132075, "percentage": 75.65, "elapsed_time": "0:49:09", "remaining_time": "0:15:49", "throughput": 5681.99, "total_tokens": 16758432} {"current_steps": 25665, "total_steps": 33920, "loss": 0.3664, "lr": 1.6986311940960148e-06, "epoch": 15.132665094339623, "percentage": 75.66, "elapsed_time": "0:49:09", "remaining_time": "0:15:48", "throughput": 5681.77, "total_tokens": 16760896} {"current_steps": 25670, "total_steps": 33920, "loss": 0.3304, "lr": 1.696699458576308e-06, "epoch": 15.13561320754717, "percentage": 75.68, "elapsed_time": "0:49:10", "remaining_time": "0:15:48", "throughput": 5681.85, "total_tokens": 16764032} {"current_steps": 25675, "total_steps": 33920, "loss": 0.3979, "lr": 1.6947685976196581e-06, "epoch": 15.138561320754716, "percentage": 75.69, "elapsed_time": "0:49:10", "remaining_time": "0:15:47", "throughput": 5681.81, "total_tokens": 16766912} {"current_steps": 25680, "total_steps": 33920, "loss": 0.3337, "lr": 1.692838611737267e-06, "epoch": 15.141509433962264, "percentage": 75.71, "elapsed_time": "0:49:11", "remaining_time": "0:15:47", "throughput": 5681.89, "total_tokens": 16770304} {"current_steps": 25685, "total_steps": 33920, "loss": 0.3284, "lr": 1.690909501440106e-06, "epoch": 15.14445754716981, "percentage": 75.72, "elapsed_time": "0:49:12", "remaining_time": "0:15:46", "throughput": 5681.79, "total_tokens": 16772768} {"current_steps": 25690, "total_steps": 33920, "loss": 0.2909, "lr": 1.688981267238915e-06, "epoch": 15.147405660377359, "percentage": 75.74, "elapsed_time": "0:49:12", "remaining_time": "0:15:45", "throughput": 5681.77, "total_tokens": 16775936} {"current_steps": 25695, "total_steps": 33920, "loss": 0.3852, "lr": 1.687053909644204e-06, "epoch": 15.150353773584905, "percentage": 75.75, "elapsed_time": "0:49:13", "remaining_time": "0:15:45", "throughput": 5681.72, "total_tokens": 16778784} {"current_steps": 25700, "total_steps": 33920, "loss": 0.3124, "lr": 1.685127429166249e-06, "epoch": 15.153301886792454, "percentage": 75.77, "elapsed_time": "0:49:13", "remaining_time": "0:15:44", "throughput": 5681.85, "total_tokens": 16782176} {"current_steps": 25705, "total_steps": 33920, "loss": 0.389, "lr": 1.683201826315093e-06, "epoch": 15.15625, "percentage": 75.78, "elapsed_time": "0:49:14", "remaining_time": "0:15:44", "throughput": 5681.91, "total_tokens": 16785344} {"current_steps": 25710, "total_steps": 33920, "loss": 0.4336, "lr": 1.681277101600548e-06, "epoch": 15.159198113207546, "percentage": 75.8, "elapsed_time": "0:49:14", "remaining_time": "0:15:43", "throughput": 5681.75, "total_tokens": 16788032} {"current_steps": 25715, "total_steps": 33920, "loss": 0.3817, "lr": 1.6793532555321939e-06, "epoch": 15.162146226415095, "percentage": 75.81, "elapsed_time": "0:49:15", "remaining_time": "0:15:42", "throughput": 5681.86, "total_tokens": 16791648} {"current_steps": 25720, "total_steps": 33920, "loss": 0.4318, "lr": 1.6774302886193744e-06, "epoch": 15.165094339622641, "percentage": 75.83, "elapsed_time": "0:49:15", "remaining_time": "0:15:42", "throughput": 5681.8, "total_tokens": 16794368} {"current_steps": 25725, "total_steps": 33920, "loss": 0.3124, "lr": 1.6755082013712076e-06, "epoch": 15.16804245283019, "percentage": 75.84, "elapsed_time": "0:49:16", "remaining_time": "0:15:41", "throughput": 5681.59, "total_tokens": 16796640} {"current_steps": 25730, "total_steps": 33920, "loss": 0.3717, "lr": 1.6735869942965716e-06, "epoch": 15.170990566037736, "percentage": 75.85, "elapsed_time": "0:49:16", "remaining_time": "0:15:41", "throughput": 5681.51, "total_tokens": 16799616} {"current_steps": 25735, "total_steps": 33920, "loss": 0.3702, "lr": 1.6716666679041155e-06, "epoch": 15.173938679245284, "percentage": 75.87, "elapsed_time": "0:49:17", "remaining_time": "0:15:40", "throughput": 5681.49, "total_tokens": 16802784} {"current_steps": 25740, "total_steps": 33920, "loss": 0.2783, "lr": 1.6697472227022533e-06, "epoch": 15.17688679245283, "percentage": 75.88, "elapsed_time": "0:49:17", "remaining_time": "0:15:40", "throughput": 5681.44, "total_tokens": 16805568} {"current_steps": 25745, "total_steps": 33920, "loss": 0.2429, "lr": 1.6678286591991644e-06, "epoch": 15.179834905660377, "percentage": 75.9, "elapsed_time": "0:49:18", "remaining_time": "0:15:39", "throughput": 5681.53, "total_tokens": 16809312} {"current_steps": 25750, "total_steps": 33920, "loss": 0.4033, "lr": 1.665910977902801e-06, "epoch": 15.182783018867925, "percentage": 75.91, "elapsed_time": "0:49:19", "remaining_time": "0:15:38", "throughput": 5681.23, "total_tokens": 16811328} {"current_steps": 25755, "total_steps": 33920, "loss": 0.357, "lr": 1.6639941793208747e-06, "epoch": 15.185731132075471, "percentage": 75.93, "elapsed_time": "0:49:19", "remaining_time": "0:15:38", "throughput": 5681.15, "total_tokens": 16814144} {"current_steps": 25760, "total_steps": 33920, "loss": 0.2642, "lr": 1.6620782639608674e-06, "epoch": 15.18867924528302, "percentage": 75.94, "elapsed_time": "0:49:20", "remaining_time": "0:15:37", "throughput": 5681.13, "total_tokens": 16817248} {"current_steps": 25765, "total_steps": 33920, "loss": 0.3698, "lr": 1.6601632323300231e-06, "epoch": 15.191627358490566, "percentage": 75.96, "elapsed_time": "0:49:20", "remaining_time": "0:15:37", "throughput": 5681.22, "total_tokens": 16820800} {"current_steps": 25770, "total_steps": 33920, "loss": 0.3494, "lr": 1.6582490849353595e-06, "epoch": 15.194575471698114, "percentage": 75.97, "elapsed_time": "0:49:21", "remaining_time": "0:15:36", "throughput": 5681.13, "total_tokens": 16823872} {"current_steps": 25775, "total_steps": 33920, "loss": 0.4361, "lr": 1.6563358222836523e-06, "epoch": 15.19752358490566, "percentage": 75.99, "elapsed_time": "0:49:21", "remaining_time": "0:15:35", "throughput": 5680.95, "total_tokens": 16826560} {"current_steps": 25780, "total_steps": 33920, "loss": 0.353, "lr": 1.654423444881445e-06, "epoch": 15.200471698113208, "percentage": 76.0, "elapsed_time": "0:49:22", "remaining_time": "0:15:35", "throughput": 5681.05, "total_tokens": 16829920} {"current_steps": 25785, "total_steps": 33920, "loss": 0.4059, "lr": 1.652511953235051e-06, "epoch": 15.203419811320755, "percentage": 76.02, "elapsed_time": "0:49:23", "remaining_time": "0:15:34", "throughput": 5681.11, "total_tokens": 16833280} {"current_steps": 25790, "total_steps": 33920, "loss": 0.2628, "lr": 1.650601347850544e-06, "epoch": 15.206367924528301, "percentage": 76.03, "elapsed_time": "0:49:23", "remaining_time": "0:15:34", "throughput": 5681.24, "total_tokens": 16837088} {"current_steps": 25795, "total_steps": 33920, "loss": 0.2907, "lr": 1.6486916292337652e-06, "epoch": 15.20931603773585, "percentage": 76.05, "elapsed_time": "0:49:24", "remaining_time": "0:15:33", "throughput": 5681.39, "total_tokens": 16841024} {"current_steps": 25800, "total_steps": 33920, "loss": 0.285, "lr": 1.6467827978903212e-06, "epoch": 15.212264150943396, "percentage": 76.06, "elapsed_time": "0:49:24", "remaining_time": "0:15:33", "throughput": 5681.25, "total_tokens": 16843648} {"current_steps": 25805, "total_steps": 33920, "loss": 0.2227, "lr": 1.6448748543255827e-06, "epoch": 15.215212264150944, "percentage": 76.08, "elapsed_time": "0:49:25", "remaining_time": "0:15:32", "throughput": 5681.24, "total_tokens": 16846528} {"current_steps": 25810, "total_steps": 33920, "loss": 0.2729, "lr": 1.6429677990446845e-06, "epoch": 15.21816037735849, "percentage": 76.09, "elapsed_time": "0:49:25", "remaining_time": "0:15:31", "throughput": 5681.13, "total_tokens": 16849152} {"current_steps": 25815, "total_steps": 33920, "loss": 0.2593, "lr": 1.6410616325525319e-06, "epoch": 15.221108490566039, "percentage": 76.11, "elapsed_time": "0:49:26", "remaining_time": "0:15:31", "throughput": 5681.2, "total_tokens": 16853312} {"current_steps": 25820, "total_steps": 33920, "loss": 0.2888, "lr": 1.6391563553537875e-06, "epoch": 15.224056603773585, "percentage": 76.12, "elapsed_time": "0:49:27", "remaining_time": "0:15:30", "throughput": 5681.05, "total_tokens": 16855968} {"current_steps": 25825, "total_steps": 33920, "loss": 0.2297, "lr": 1.6372519679528832e-06, "epoch": 15.227004716981131, "percentage": 76.14, "elapsed_time": "0:49:27", "remaining_time": "0:15:30", "throughput": 5680.97, "total_tokens": 16858816} {"current_steps": 25830, "total_steps": 33920, "loss": 0.284, "lr": 1.6353484708540124e-06, "epoch": 15.22995283018868, "percentage": 76.15, "elapsed_time": "0:49:28", "remaining_time": "0:15:29", "throughput": 5681.04, "total_tokens": 16862240} {"current_steps": 25835, "total_steps": 33920, "loss": 0.216, "lr": 1.633445864561135e-06, "epoch": 15.232900943396226, "percentage": 76.16, "elapsed_time": "0:49:28", "remaining_time": "0:15:29", "throughput": 5681.02, "total_tokens": 16865312} {"current_steps": 25840, "total_steps": 33920, "loss": 0.3221, "lr": 1.6315441495779726e-06, "epoch": 15.235849056603774, "percentage": 76.18, "elapsed_time": "0:49:29", "remaining_time": "0:15:28", "throughput": 5680.94, "total_tokens": 16867936} {"current_steps": 25845, "total_steps": 33920, "loss": 0.3484, "lr": 1.6296433264080152e-06, "epoch": 15.23879716981132, "percentage": 76.19, "elapsed_time": "0:49:29", "remaining_time": "0:15:27", "throughput": 5681.07, "total_tokens": 16871968} {"current_steps": 25850, "total_steps": 33920, "loss": 0.2495, "lr": 1.627743395554513e-06, "epoch": 15.241745283018869, "percentage": 76.21, "elapsed_time": "0:49:30", "remaining_time": "0:15:27", "throughput": 5680.88, "total_tokens": 16874464} {"current_steps": 25855, "total_steps": 33920, "loss": 0.3398, "lr": 1.6258443575204802e-06, "epoch": 15.244693396226415, "percentage": 76.22, "elapsed_time": "0:49:31", "remaining_time": "0:15:26", "throughput": 5680.93, "total_tokens": 16878304} {"current_steps": 25860, "total_steps": 33920, "loss": 0.4084, "lr": 1.6239462128086936e-06, "epoch": 15.247641509433961, "percentage": 76.24, "elapsed_time": "0:49:31", "remaining_time": "0:15:26", "throughput": 5680.87, "total_tokens": 16880992} {"current_steps": 25865, "total_steps": 33920, "loss": 0.305, "lr": 1.6220489619216988e-06, "epoch": 15.25058962264151, "percentage": 76.25, "elapsed_time": "0:49:32", "remaining_time": "0:15:25", "throughput": 5680.97, "total_tokens": 16884416} {"current_steps": 25870, "total_steps": 33920, "loss": 0.3347, "lr": 1.6201526053618e-06, "epoch": 15.253537735849056, "percentage": 76.27, "elapsed_time": "0:49:32", "remaining_time": "0:15:25", "throughput": 5681.33, "total_tokens": 16890112} {"current_steps": 25875, "total_steps": 33920, "loss": 0.2463, "lr": 1.6182571436310634e-06, "epoch": 15.256485849056604, "percentage": 76.28, "elapsed_time": "0:49:33", "remaining_time": "0:15:24", "throughput": 5681.41, "total_tokens": 16893792} {"current_steps": 25880, "total_steps": 33920, "loss": 0.2625, "lr": 1.616362577231324e-06, "epoch": 15.25943396226415, "percentage": 76.3, "elapsed_time": "0:49:34", "remaining_time": "0:15:23", "throughput": 5681.48, "total_tokens": 16897376} {"current_steps": 25885, "total_steps": 33920, "loss": 0.2669, "lr": 1.614468906664175e-06, "epoch": 15.262382075471699, "percentage": 76.31, "elapsed_time": "0:49:34", "remaining_time": "0:15:23", "throughput": 5681.35, "total_tokens": 16899968} {"current_steps": 25890, "total_steps": 33920, "loss": 0.4096, "lr": 1.612576132430974e-06, "epoch": 15.265330188679245, "percentage": 76.33, "elapsed_time": "0:49:35", "remaining_time": "0:15:22", "throughput": 5681.34, "total_tokens": 16902944} {"current_steps": 25895, "total_steps": 33920, "loss": 0.2346, "lr": 1.6106842550328406e-06, "epoch": 15.268278301886792, "percentage": 76.34, "elapsed_time": "0:49:35", "remaining_time": "0:15:22", "throughput": 5681.26, "total_tokens": 16905664} {"current_steps": 25900, "total_steps": 33920, "loss": 0.2025, "lr": 1.6087932749706582e-06, "epoch": 15.27122641509434, "percentage": 76.36, "elapsed_time": "0:49:36", "remaining_time": "0:15:21", "throughput": 5681.55, "total_tokens": 16912096} {"current_steps": 25905, "total_steps": 33920, "loss": 0.2872, "lr": 1.6069031927450696e-06, "epoch": 15.274174528301886, "percentage": 76.37, "elapsed_time": "0:49:37", "remaining_time": "0:15:21", "throughput": 5681.68, "total_tokens": 16915616} {"current_steps": 25910, "total_steps": 33920, "loss": 0.2822, "lr": 1.605014008856486e-06, "epoch": 15.277122641509434, "percentage": 76.39, "elapsed_time": "0:49:37", "remaining_time": "0:15:20", "throughput": 5681.64, "total_tokens": 16919008} {"current_steps": 25915, "total_steps": 33920, "loss": 0.4182, "lr": 1.6031257238050745e-06, "epoch": 15.28007075471698, "percentage": 76.4, "elapsed_time": "0:49:38", "remaining_time": "0:15:19", "throughput": 5681.51, "total_tokens": 16921568} {"current_steps": 25920, "total_steps": 33920, "loss": 0.238, "lr": 1.601238338090768e-06, "epoch": 15.283018867924529, "percentage": 76.42, "elapsed_time": "0:49:38", "remaining_time": "0:15:19", "throughput": 5681.39, "total_tokens": 16924128} {"current_steps": 25925, "total_steps": 33920, "loss": 0.2561, "lr": 1.5993518522132595e-06, "epoch": 15.285966981132075, "percentage": 76.43, "elapsed_time": "0:49:39", "remaining_time": "0:15:18", "throughput": 5681.52, "total_tokens": 16927776} {"current_steps": 25930, "total_steps": 33920, "loss": 0.3429, "lr": 1.5974662666720037e-06, "epoch": 15.288915094339623, "percentage": 76.44, "elapsed_time": "0:49:39", "remaining_time": "0:15:18", "throughput": 5681.4, "total_tokens": 16930304} {"current_steps": 25935, "total_steps": 33920, "loss": 0.2773, "lr": 1.5955815819662162e-06, "epoch": 15.29186320754717, "percentage": 76.46, "elapsed_time": "0:49:40", "remaining_time": "0:15:17", "throughput": 5681.52, "total_tokens": 16933920} {"current_steps": 25940, "total_steps": 33920, "loss": 0.2703, "lr": 1.5936977985948788e-06, "epoch": 15.294811320754716, "percentage": 76.47, "elapsed_time": "0:49:41", "remaining_time": "0:15:17", "throughput": 5681.58, "total_tokens": 16937280} {"current_steps": 25945, "total_steps": 33920, "loss": 0.3939, "lr": 1.5918149170567298e-06, "epoch": 15.297759433962264, "percentage": 76.49, "elapsed_time": "0:49:41", "remaining_time": "0:15:16", "throughput": 5681.35, "total_tokens": 16939648} {"current_steps": 25950, "total_steps": 33920, "loss": 0.2569, "lr": 1.5899329378502698e-06, "epoch": 15.30070754716981, "percentage": 76.5, "elapsed_time": "0:49:42", "remaining_time": "0:15:15", "throughput": 5681.42, "total_tokens": 16943296} {"current_steps": 25955, "total_steps": 33920, "loss": 0.2147, "lr": 1.588051861473761e-06, "epoch": 15.303655660377359, "percentage": 76.52, "elapsed_time": "0:49:42", "remaining_time": "0:15:15", "throughput": 5681.41, "total_tokens": 16946016} {"current_steps": 25960, "total_steps": 33920, "loss": 0.3417, "lr": 1.5861716884252253e-06, "epoch": 15.306603773584905, "percentage": 76.53, "elapsed_time": "0:49:43", "remaining_time": "0:15:14", "throughput": 5681.46, "total_tokens": 16949248} {"current_steps": 25965, "total_steps": 33920, "loss": 0.2476, "lr": 1.5842924192024489e-06, "epoch": 15.309551886792454, "percentage": 76.55, "elapsed_time": "0:49:43", "remaining_time": "0:15:14", "throughput": 5681.39, "total_tokens": 16951968} {"current_steps": 25970, "total_steps": 33920, "loss": 0.431, "lr": 1.5824140543029742e-06, "epoch": 15.3125, "percentage": 76.56, "elapsed_time": "0:49:44", "remaining_time": "0:15:13", "throughput": 5681.52, "total_tokens": 16955360} {"current_steps": 25975, "total_steps": 33920, "loss": 0.3109, "lr": 1.5805365942241092e-06, "epoch": 15.315448113207546, "percentage": 76.58, "elapsed_time": "0:49:44", "remaining_time": "0:15:12", "throughput": 5681.61, "total_tokens": 16959040} {"current_steps": 25980, "total_steps": 33920, "loss": 0.4035, "lr": 1.5786600394629181e-06, "epoch": 15.318396226415095, "percentage": 76.59, "elapsed_time": "0:49:45", "remaining_time": "0:15:12", "throughput": 5681.88, "total_tokens": 16963456} {"current_steps": 25985, "total_steps": 33920, "loss": 0.315, "lr": 1.5767843905162261e-06, "epoch": 15.321344339622641, "percentage": 76.61, "elapsed_time": "0:49:46", "remaining_time": "0:15:11", "throughput": 5681.95, "total_tokens": 16966528} {"current_steps": 25990, "total_steps": 33920, "loss": 0.3156, "lr": 1.5749096478806209e-06, "epoch": 15.32429245283019, "percentage": 76.62, "elapsed_time": "0:49:46", "remaining_time": "0:15:11", "throughput": 5682.0, "total_tokens": 16969824} {"current_steps": 25995, "total_steps": 33920, "loss": 0.2571, "lr": 1.5730358120524452e-06, "epoch": 15.327240566037736, "percentage": 76.64, "elapsed_time": "0:49:47", "remaining_time": "0:15:10", "throughput": 5682.1, "total_tokens": 16973536} {"current_steps": 26000, "total_steps": 33920, "loss": 0.278, "lr": 1.5711628835278098e-06, "epoch": 15.330188679245284, "percentage": 76.65, "elapsed_time": "0:49:47", "remaining_time": "0:15:10", "throughput": 5681.87, "total_tokens": 16975808} {"current_steps": 26005, "total_steps": 33920, "loss": 0.2894, "lr": 1.5692908628025782e-06, "epoch": 15.33313679245283, "percentage": 76.67, "elapsed_time": "0:49:48", "remaining_time": "0:15:09", "throughput": 5681.82, "total_tokens": 16979200} {"current_steps": 26010, "total_steps": 33920, "loss": 0.3037, "lr": 1.5674197503723765e-06, "epoch": 15.336084905660377, "percentage": 76.68, "elapsed_time": "0:49:48", "remaining_time": "0:15:08", "throughput": 5681.78, "total_tokens": 16982048} {"current_steps": 26015, "total_steps": 33920, "loss": 0.2992, "lr": 1.5655495467325893e-06, "epoch": 15.339033018867925, "percentage": 76.7, "elapsed_time": "0:49:49", "remaining_time": "0:15:08", "throughput": 5681.6, "total_tokens": 16984608} {"current_steps": 26020, "total_steps": 33920, "loss": 0.2037, "lr": 1.5636802523783613e-06, "epoch": 15.341981132075471, "percentage": 76.71, "elapsed_time": "0:49:49", "remaining_time": "0:15:07", "throughput": 5681.57, "total_tokens": 16987456} {"current_steps": 26025, "total_steps": 33920, "loss": 0.3017, "lr": 1.5618118678045947e-06, "epoch": 15.34492924528302, "percentage": 76.72, "elapsed_time": "0:49:50", "remaining_time": "0:15:07", "throughput": 5681.52, "total_tokens": 16990048} {"current_steps": 26030, "total_steps": 33920, "loss": 0.3415, "lr": 1.5599443935059549e-06, "epoch": 15.347877358490566, "percentage": 76.74, "elapsed_time": "0:49:50", "remaining_time": "0:15:06", "throughput": 5681.5, "total_tokens": 16993024} {"current_steps": 26035, "total_steps": 33920, "loss": 0.2772, "lr": 1.5580778299768635e-06, "epoch": 15.350825471698114, "percentage": 76.75, "elapsed_time": "0:49:51", "remaining_time": "0:15:05", "throughput": 5681.38, "total_tokens": 16995552} {"current_steps": 26040, "total_steps": 33920, "loss": 0.3273, "lr": 1.5562121777114997e-06, "epoch": 15.35377358490566, "percentage": 76.77, "elapsed_time": "0:49:51", "remaining_time": "0:15:05", "throughput": 5681.46, "total_tokens": 16998848} {"current_steps": 26045, "total_steps": 33920, "loss": 0.3127, "lr": 1.5543474372038043e-06, "epoch": 15.356721698113208, "percentage": 76.78, "elapsed_time": "0:49:52", "remaining_time": "0:15:04", "throughput": 5681.42, "total_tokens": 17001792} {"current_steps": 26050, "total_steps": 33920, "loss": 0.3338, "lr": 1.5524836089474748e-06, "epoch": 15.359669811320755, "percentage": 76.8, "elapsed_time": "0:49:53", "remaining_time": "0:15:04", "throughput": 5681.35, "total_tokens": 17004576} {"current_steps": 26055, "total_steps": 33920, "loss": 0.3955, "lr": 1.5506206934359664e-06, "epoch": 15.362617924528301, "percentage": 76.81, "elapsed_time": "0:49:53", "remaining_time": "0:15:03", "throughput": 5681.55, "total_tokens": 17008736} {"current_steps": 26060, "total_steps": 33920, "loss": 0.2797, "lr": 1.5487586911624947e-06, "epoch": 15.36556603773585, "percentage": 76.83, "elapsed_time": "0:49:54", "remaining_time": "0:15:03", "throughput": 5681.61, "total_tokens": 17012128} {"current_steps": 26065, "total_steps": 33920, "loss": 0.3364, "lr": 1.5468976026200355e-06, "epoch": 15.368514150943396, "percentage": 76.84, "elapsed_time": "0:49:54", "remaining_time": "0:15:02", "throughput": 5681.69, "total_tokens": 17015584} {"current_steps": 26070, "total_steps": 33920, "loss": 0.3649, "lr": 1.5450374283013187e-06, "epoch": 15.371462264150944, "percentage": 76.86, "elapsed_time": "0:49:55", "remaining_time": "0:15:01", "throughput": 5681.82, "total_tokens": 17019456} {"current_steps": 26075, "total_steps": 33920, "loss": 0.2437, "lr": 1.5431781686988317e-06, "epoch": 15.37441037735849, "percentage": 76.87, "elapsed_time": "0:49:55", "remaining_time": "0:15:01", "throughput": 5681.83, "total_tokens": 17022272} {"current_steps": 26080, "total_steps": 33920, "loss": 0.3765, "lr": 1.5413198243048233e-06, "epoch": 15.377358490566039, "percentage": 76.89, "elapsed_time": "0:49:56", "remaining_time": "0:15:00", "throughput": 5681.93, "total_tokens": 17025856} {"current_steps": 26085, "total_steps": 33920, "loss": 0.3269, "lr": 1.5394623956112974e-06, "epoch": 15.380306603773585, "percentage": 76.9, "elapsed_time": "0:49:57", "remaining_time": "0:15:00", "throughput": 5682.01, "total_tokens": 17029024} {"current_steps": 26090, "total_steps": 33920, "loss": 0.4038, "lr": 1.537605883110015e-06, "epoch": 15.383254716981131, "percentage": 76.92, "elapsed_time": "0:49:57", "remaining_time": "0:14:59", "throughput": 5682.21, "total_tokens": 17033056} {"current_steps": 26095, "total_steps": 33920, "loss": 0.361, "lr": 1.5357502872924984e-06, "epoch": 15.38620283018868, "percentage": 76.93, "elapsed_time": "0:49:58", "remaining_time": "0:14:59", "throughput": 5682.05, "total_tokens": 17035488} {"current_steps": 26100, "total_steps": 33920, "loss": 0.2865, "lr": 1.5338956086500235e-06, "epoch": 15.389150943396226, "percentage": 76.95, "elapsed_time": "0:49:58", "remaining_time": "0:14:58", "throughput": 5682.16, "total_tokens": 17039296} {"current_steps": 26105, "total_steps": 33920, "loss": 0.3838, "lr": 1.5320418476736237e-06, "epoch": 15.392099056603774, "percentage": 76.96, "elapsed_time": "0:49:59", "remaining_time": "0:14:57", "throughput": 5682.25, "total_tokens": 17043104} {"current_steps": 26110, "total_steps": 33920, "loss": 0.2337, "lr": 1.5301890048540912e-06, "epoch": 15.39504716981132, "percentage": 76.98, "elapsed_time": "0:49:59", "remaining_time": "0:14:57", "throughput": 5682.22, "total_tokens": 17046080} {"current_steps": 26115, "total_steps": 33920, "loss": 0.3338, "lr": 1.5283370806819743e-06, "epoch": 15.397995283018869, "percentage": 76.99, "elapsed_time": "0:50:00", "remaining_time": "0:14:56", "throughput": 5682.17, "total_tokens": 17048768} {"current_steps": 26120, "total_steps": 33920, "loss": 0.2568, "lr": 1.5264860756475752e-06, "epoch": 15.400943396226415, "percentage": 77.0, "elapsed_time": "0:50:00", "remaining_time": "0:14:56", "throughput": 5682.09, "total_tokens": 17051680} {"current_steps": 26125, "total_steps": 33920, "loss": 0.2933, "lr": 1.5246359902409592e-06, "epoch": 15.403891509433961, "percentage": 77.02, "elapsed_time": "0:50:01", "remaining_time": "0:14:55", "throughput": 5682.11, "total_tokens": 17054944} {"current_steps": 26130, "total_steps": 33920, "loss": 0.3394, "lr": 1.5227868249519423e-06, "epoch": 15.40683962264151, "percentage": 77.03, "elapsed_time": "0:50:02", "remaining_time": "0:14:54", "throughput": 5682.15, "total_tokens": 17058048} {"current_steps": 26135, "total_steps": 33920, "loss": 0.2944, "lr": 1.5209385802700999e-06, "epoch": 15.409787735849056, "percentage": 77.05, "elapsed_time": "0:50:02", "remaining_time": "0:14:54", "throughput": 5682.11, "total_tokens": 17060960} {"current_steps": 26140, "total_steps": 33920, "loss": 0.2966, "lr": 1.5190912566847626e-06, "epoch": 15.412735849056604, "percentage": 77.06, "elapsed_time": "0:50:03", "remaining_time": "0:14:53", "throughput": 5682.25, "total_tokens": 17064992} {"current_steps": 26145, "total_steps": 33920, "loss": 0.2344, "lr": 1.5172448546850166e-06, "epoch": 15.41568396226415, "percentage": 77.08, "elapsed_time": "0:50:03", "remaining_time": "0:14:53", "throughput": 5682.24, "total_tokens": 17067936} {"current_steps": 26150, "total_steps": 33920, "loss": 0.2554, "lr": 1.515399374759704e-06, "epoch": 15.418632075471699, "percentage": 77.09, "elapsed_time": "0:50:04", "remaining_time": "0:14:52", "throughput": 5682.22, "total_tokens": 17071168} {"current_steps": 26155, "total_steps": 33920, "loss": 0.282, "lr": 1.513554817397424e-06, "epoch": 15.421580188679245, "percentage": 77.11, "elapsed_time": "0:50:04", "remaining_time": "0:14:52", "throughput": 5682.29, "total_tokens": 17074560} {"current_steps": 26160, "total_steps": 33920, "loss": 0.3104, "lr": 1.5117111830865338e-06, "epoch": 15.424528301886792, "percentage": 77.12, "elapsed_time": "0:50:05", "remaining_time": "0:14:51", "throughput": 5682.19, "total_tokens": 17077312} {"current_steps": 26165, "total_steps": 33920, "loss": 0.2123, "lr": 1.509868472315142e-06, "epoch": 15.42747641509434, "percentage": 77.14, "elapsed_time": "0:50:06", "remaining_time": "0:14:50", "throughput": 5682.16, "total_tokens": 17080608} {"current_steps": 26170, "total_steps": 33920, "loss": 0.2791, "lr": 1.508026685571113e-06, "epoch": 15.430424528301886, "percentage": 77.15, "elapsed_time": "0:50:06", "remaining_time": "0:14:50", "throughput": 5681.93, "total_tokens": 17083072} {"current_steps": 26175, "total_steps": 33920, "loss": 0.2194, "lr": 1.506185823342069e-06, "epoch": 15.433372641509434, "percentage": 77.17, "elapsed_time": "0:50:07", "remaining_time": "0:14:49", "throughput": 5681.87, "total_tokens": 17086208} {"current_steps": 26180, "total_steps": 33920, "loss": 0.3421, "lr": 1.504345886115386e-06, "epoch": 15.43632075471698, "percentage": 77.18, "elapsed_time": "0:50:07", "remaining_time": "0:14:49", "throughput": 5681.89, "total_tokens": 17089312} {"current_steps": 26185, "total_steps": 33920, "loss": 0.3095, "lr": 1.502506874378193e-06, "epoch": 15.439268867924529, "percentage": 77.2, "elapsed_time": "0:50:08", "remaining_time": "0:14:48", "throughput": 5681.86, "total_tokens": 17092576} {"current_steps": 26190, "total_steps": 33920, "loss": 0.4259, "lr": 1.5006687886173805e-06, "epoch": 15.442216981132075, "percentage": 77.21, "elapsed_time": "0:50:08", "remaining_time": "0:14:48", "throughput": 5682.04, "total_tokens": 17096896} {"current_steps": 26195, "total_steps": 33920, "loss": 0.2983, "lr": 1.498831629319587e-06, "epoch": 15.445165094339623, "percentage": 77.23, "elapsed_time": "0:50:09", "remaining_time": "0:14:47", "throughput": 5682.15, "total_tokens": 17100320} {"current_steps": 26200, "total_steps": 33920, "loss": 0.3975, "lr": 1.4969953969712087e-06, "epoch": 15.44811320754717, "percentage": 77.24, "elapsed_time": "0:50:10", "remaining_time": "0:14:46", "throughput": 5682.1, "total_tokens": 17103200} {"current_steps": 26205, "total_steps": 33920, "loss": 0.3394, "lr": 1.4951600920583963e-06, "epoch": 15.451061320754716, "percentage": 77.26, "elapsed_time": "0:50:10", "remaining_time": "0:14:46", "throughput": 5682.17, "total_tokens": 17106336} {"current_steps": 26210, "total_steps": 33920, "loss": 0.4025, "lr": 1.493325715067055e-06, "epoch": 15.454009433962264, "percentage": 77.27, "elapsed_time": "0:50:11", "remaining_time": "0:14:45", "throughput": 5682.23, "total_tokens": 17109728} {"current_steps": 26215, "total_steps": 33920, "loss": 0.3181, "lr": 1.4914922664828417e-06, "epoch": 15.45695754716981, "percentage": 77.28, "elapsed_time": "0:50:11", "remaining_time": "0:14:45", "throughput": 5682.22, "total_tokens": 17113152} {"current_steps": 26220, "total_steps": 33920, "loss": 0.342, "lr": 1.4896597467911732e-06, "epoch": 15.459905660377359, "percentage": 77.3, "elapsed_time": "0:50:12", "remaining_time": "0:14:44", "throughput": 5682.11, "total_tokens": 17115904} {"current_steps": 26225, "total_steps": 33920, "loss": 0.2785, "lr": 1.4878281564772156e-06, "epoch": 15.462853773584905, "percentage": 77.31, "elapsed_time": "0:50:12", "remaining_time": "0:14:44", "throughput": 5682.08, "total_tokens": 17118752} {"current_steps": 26230, "total_steps": 33920, "loss": 0.2652, "lr": 1.4859974960258898e-06, "epoch": 15.465801886792454, "percentage": 77.33, "elapsed_time": "0:50:13", "remaining_time": "0:14:43", "throughput": 5682.14, "total_tokens": 17121888} {"current_steps": 26235, "total_steps": 33920, "loss": 0.349, "lr": 1.4841677659218723e-06, "epoch": 15.46875, "percentage": 77.34, "elapsed_time": "0:50:13", "remaining_time": "0:14:42", "throughput": 5682.02, "total_tokens": 17124320} {"current_steps": 26240, "total_steps": 33920, "loss": 0.3724, "lr": 1.4823389666495886e-06, "epoch": 15.471698113207546, "percentage": 77.36, "elapsed_time": "0:50:14", "remaining_time": "0:14:42", "throughput": 5682.18, "total_tokens": 17128480} {"current_steps": 26245, "total_steps": 33920, "loss": 0.3636, "lr": 1.4805110986932258e-06, "epoch": 15.474646226415095, "percentage": 77.37, "elapsed_time": "0:50:15", "remaining_time": "0:14:41", "throughput": 5682.26, "total_tokens": 17132160} {"current_steps": 26250, "total_steps": 33920, "loss": 0.2759, "lr": 1.4786841625367166e-06, "epoch": 15.477594339622641, "percentage": 77.39, "elapsed_time": "0:50:15", "remaining_time": "0:14:41", "throughput": 5682.28, "total_tokens": 17135392} {"current_steps": 26255, "total_steps": 33920, "loss": 0.3144, "lr": 1.476858158663752e-06, "epoch": 15.48054245283019, "percentage": 77.4, "elapsed_time": "0:50:16", "remaining_time": "0:14:40", "throughput": 5682.4, "total_tokens": 17139232} {"current_steps": 26260, "total_steps": 33920, "loss": 0.3538, "lr": 1.4750330875577745e-06, "epoch": 15.483490566037736, "percentage": 77.42, "elapsed_time": "0:50:16", "remaining_time": "0:14:39", "throughput": 5682.55, "total_tokens": 17142976} {"current_steps": 26265, "total_steps": 33920, "loss": 0.2685, "lr": 1.4732089497019787e-06, "epoch": 15.486438679245284, "percentage": 77.43, "elapsed_time": "0:50:17", "remaining_time": "0:14:39", "throughput": 5682.51, "total_tokens": 17145824} {"current_steps": 26270, "total_steps": 33920, "loss": 0.2811, "lr": 1.471385745579313e-06, "epoch": 15.48938679245283, "percentage": 77.45, "elapsed_time": "0:50:17", "remaining_time": "0:14:38", "throughput": 5682.37, "total_tokens": 17148320} {"current_steps": 26275, "total_steps": 33920, "loss": 0.2491, "lr": 1.4695634756724775e-06, "epoch": 15.492334905660377, "percentage": 77.46, "elapsed_time": "0:50:18", "remaining_time": "0:14:38", "throughput": 5682.45, "total_tokens": 17151584} {"current_steps": 26280, "total_steps": 33920, "loss": 0.3467, "lr": 1.4677421404639281e-06, "epoch": 15.495283018867925, "percentage": 77.48, "elapsed_time": "0:50:18", "remaining_time": "0:14:37", "throughput": 5682.46, "total_tokens": 17154496} {"current_steps": 26285, "total_steps": 33920, "loss": 0.313, "lr": 1.4659217404358706e-06, "epoch": 15.498231132075471, "percentage": 77.49, "elapsed_time": "0:50:19", "remaining_time": "0:14:37", "throughput": 5682.42, "total_tokens": 17157376} {"current_steps": 26290, "total_steps": 33920, "loss": 0.4681, "lr": 1.4641022760702627e-06, "epoch": 15.50117924528302, "percentage": 77.51, "elapsed_time": "0:50:20", "remaining_time": "0:14:36", "throughput": 5682.61, "total_tokens": 17161792} {"current_steps": 26295, "total_steps": 33920, "loss": 0.2548, "lr": 1.4622837478488172e-06, "epoch": 15.504127358490566, "percentage": 77.52, "elapsed_time": "0:50:20", "remaining_time": "0:14:35", "throughput": 5682.55, "total_tokens": 17164992} {"current_steps": 26300, "total_steps": 33920, "loss": 0.422, "lr": 1.4604661562529953e-06, "epoch": 15.507075471698114, "percentage": 77.54, "elapsed_time": "0:50:21", "remaining_time": "0:14:35", "throughput": 5682.7, "total_tokens": 17168672} {"current_steps": 26305, "total_steps": 33920, "loss": 0.3129, "lr": 1.4586495017640119e-06, "epoch": 15.51002358490566, "percentage": 77.55, "elapsed_time": "0:50:21", "remaining_time": "0:14:34", "throughput": 5682.6, "total_tokens": 17171232} {"current_steps": 26310, "total_steps": 33920, "loss": 0.3671, "lr": 1.4568337848628366e-06, "epoch": 15.512971698113208, "percentage": 77.56, "elapsed_time": "0:50:22", "remaining_time": "0:14:34", "throughput": 5682.52, "total_tokens": 17174080} {"current_steps": 26315, "total_steps": 33920, "loss": 0.271, "lr": 1.4550190060301872e-06, "epoch": 15.515919811320755, "percentage": 77.58, "elapsed_time": "0:50:22", "remaining_time": "0:14:33", "throughput": 5682.62, "total_tokens": 17177728} {"current_steps": 26320, "total_steps": 33920, "loss": 0.2997, "lr": 1.4532051657465335e-06, "epoch": 15.518867924528301, "percentage": 77.59, "elapsed_time": "0:50:23", "remaining_time": "0:14:33", "throughput": 5682.65, "total_tokens": 17180768} {"current_steps": 26325, "total_steps": 33920, "loss": 0.3333, "lr": 1.4513922644920985e-06, "epoch": 15.52181603773585, "percentage": 77.61, "elapsed_time": "0:50:23", "remaining_time": "0:14:32", "throughput": 5682.49, "total_tokens": 17183200} {"current_steps": 26330, "total_steps": 33920, "loss": 0.2526, "lr": 1.4495803027468552e-06, "epoch": 15.524764150943396, "percentage": 77.62, "elapsed_time": "0:50:24", "remaining_time": "0:14:31", "throughput": 5682.43, "total_tokens": 17185888} {"current_steps": 26335, "total_steps": 33920, "loss": 0.2904, "lr": 1.4477692809905263e-06, "epoch": 15.527712264150944, "percentage": 77.64, "elapsed_time": "0:50:24", "remaining_time": "0:14:31", "throughput": 5682.46, "total_tokens": 17188960} {"current_steps": 26340, "total_steps": 33920, "loss": 0.3754, "lr": 1.4459591997025896e-06, "epoch": 15.53066037735849, "percentage": 77.65, "elapsed_time": "0:50:25", "remaining_time": "0:14:30", "throughput": 5682.6, "total_tokens": 17193024} {"current_steps": 26345, "total_steps": 33920, "loss": 0.3195, "lr": 1.4441500593622737e-06, "epoch": 15.533608490566039, "percentage": 77.67, "elapsed_time": "0:50:26", "remaining_time": "0:14:30", "throughput": 5682.73, "total_tokens": 17196672} {"current_steps": 26350, "total_steps": 33920, "loss": 0.3815, "lr": 1.4423418604485539e-06, "epoch": 15.536556603773585, "percentage": 77.68, "elapsed_time": "0:50:26", "remaining_time": "0:14:29", "throughput": 5682.72, "total_tokens": 17200192} {"current_steps": 26355, "total_steps": 33920, "loss": 0.3798, "lr": 1.4405346034401597e-06, "epoch": 15.539504716981131, "percentage": 77.7, "elapsed_time": "0:50:27", "remaining_time": "0:14:28", "throughput": 5682.81, "total_tokens": 17203616} {"current_steps": 26360, "total_steps": 33920, "loss": 0.2106, "lr": 1.4387282888155695e-06, "epoch": 15.54245283018868, "percentage": 77.71, "elapsed_time": "0:50:27", "remaining_time": "0:14:28", "throughput": 5682.59, "total_tokens": 17205920} {"current_steps": 26365, "total_steps": 33920, "loss": 0.3071, "lr": 1.436922917053013e-06, "epoch": 15.545400943396226, "percentage": 77.73, "elapsed_time": "0:50:28", "remaining_time": "0:14:27", "throughput": 5682.61, "total_tokens": 17209152} {"current_steps": 26370, "total_steps": 33920, "loss": 0.3295, "lr": 1.4351184886304686e-06, "epoch": 15.548349056603774, "percentage": 77.74, "elapsed_time": "0:50:29", "remaining_time": "0:14:27", "throughput": 5682.72, "total_tokens": 17213056} {"current_steps": 26375, "total_steps": 33920, "loss": 0.346, "lr": 1.4333150040256699e-06, "epoch": 15.55129716981132, "percentage": 77.76, "elapsed_time": "0:50:29", "remaining_time": "0:14:26", "throughput": 5682.68, "total_tokens": 17216032} {"current_steps": 26380, "total_steps": 33920, "loss": 0.2676, "lr": 1.4315124637160954e-06, "epoch": 15.554245283018869, "percentage": 77.77, "elapsed_time": "0:50:30", "remaining_time": "0:14:26", "throughput": 5682.95, "total_tokens": 17220640} {"current_steps": 26385, "total_steps": 33920, "loss": 0.3225, "lr": 1.4297108681789752e-06, "epoch": 15.557193396226415, "percentage": 77.79, "elapsed_time": "0:50:30", "remaining_time": "0:14:25", "throughput": 5682.91, "total_tokens": 17223520} {"current_steps": 26390, "total_steps": 33920, "loss": 0.32, "lr": 1.4279102178912902e-06, "epoch": 15.560141509433961, "percentage": 77.8, "elapsed_time": "0:50:31", "remaining_time": "0:14:24", "throughput": 5682.86, "total_tokens": 17226112} {"current_steps": 26395, "total_steps": 33920, "loss": 0.4329, "lr": 1.4261105133297693e-06, "epoch": 15.56308962264151, "percentage": 77.82, "elapsed_time": "0:50:31", "remaining_time": "0:14:24", "throughput": 5682.89, "total_tokens": 17229120} {"current_steps": 26400, "total_steps": 33920, "loss": 0.3536, "lr": 1.4243117549708913e-06, "epoch": 15.566037735849056, "percentage": 77.83, "elapsed_time": "0:50:32", "remaining_time": "0:14:23", "throughput": 5682.86, "total_tokens": 17232096} {"current_steps": 26405, "total_steps": 33920, "loss": 0.2398, "lr": 1.422513943290888e-06, "epoch": 15.568985849056604, "percentage": 77.84, "elapsed_time": "0:50:32", "remaining_time": "0:14:23", "throughput": 5683.01, "total_tokens": 17235744} {"current_steps": 26410, "total_steps": 33920, "loss": 0.3277, "lr": 1.4207170787657365e-06, "epoch": 15.57193396226415, "percentage": 77.86, "elapsed_time": "0:50:33", "remaining_time": "0:14:22", "throughput": 5683.01, "total_tokens": 17238656} {"current_steps": 26415, "total_steps": 33920, "loss": 0.3856, "lr": 1.4189211618711646e-06, "epoch": 15.574882075471699, "percentage": 77.87, "elapsed_time": "0:50:33", "remaining_time": "0:14:21", "throughput": 5683.11, "total_tokens": 17241952} {"current_steps": 26420, "total_steps": 33920, "loss": 0.2421, "lr": 1.417126193082648e-06, "epoch": 15.577830188679245, "percentage": 77.89, "elapsed_time": "0:50:34", "remaining_time": "0:14:21", "throughput": 5683.18, "total_tokens": 17245152} {"current_steps": 26425, "total_steps": 33920, "loss": 0.2122, "lr": 1.4153321728754133e-06, "epoch": 15.580778301886792, "percentage": 77.9, "elapsed_time": "0:50:34", "remaining_time": "0:14:20", "throughput": 5683.28, "total_tokens": 17248416} {"current_steps": 26430, "total_steps": 33920, "loss": 0.3111, "lr": 1.4135391017244338e-06, "epoch": 15.58372641509434, "percentage": 77.92, "elapsed_time": "0:50:35", "remaining_time": "0:14:20", "throughput": 5683.29, "total_tokens": 17251648} {"current_steps": 26435, "total_steps": 33920, "loss": 0.3405, "lr": 1.4117469801044332e-06, "epoch": 15.586674528301886, "percentage": 77.93, "elapsed_time": "0:50:36", "remaining_time": "0:14:19", "throughput": 5683.41, "total_tokens": 17255744} {"current_steps": 26440, "total_steps": 33920, "loss": 0.3773, "lr": 1.4099558084898862e-06, "epoch": 15.589622641509434, "percentage": 77.95, "elapsed_time": "0:50:36", "remaining_time": "0:14:19", "throughput": 5683.44, "total_tokens": 17259040} {"current_steps": 26445, "total_steps": 33920, "loss": 0.2728, "lr": 1.408165587355011e-06, "epoch": 15.59257075471698, "percentage": 77.96, "elapsed_time": "0:50:37", "remaining_time": "0:14:18", "throughput": 5683.55, "total_tokens": 17262784} {"current_steps": 26450, "total_steps": 33920, "loss": 0.3395, "lr": 1.4063763171737766e-06, "epoch": 15.595518867924529, "percentage": 77.98, "elapsed_time": "0:50:37", "remaining_time": "0:14:17", "throughput": 5683.46, "total_tokens": 17265504} {"current_steps": 26455, "total_steps": 33920, "loss": 0.2791, "lr": 1.4045879984198996e-06, "epoch": 15.598466981132075, "percentage": 77.99, "elapsed_time": "0:50:38", "remaining_time": "0:14:17", "throughput": 5683.57, "total_tokens": 17269440} {"current_steps": 26460, "total_steps": 33920, "loss": 0.3203, "lr": 1.4028006315668457e-06, "epoch": 15.601415094339622, "percentage": 78.01, "elapsed_time": "0:50:39", "remaining_time": "0:14:16", "throughput": 5683.59, "total_tokens": 17272480} {"current_steps": 26465, "total_steps": 33920, "loss": 0.4486, "lr": 1.4010142170878261e-06, "epoch": 15.60436320754717, "percentage": 78.02, "elapsed_time": "0:50:39", "remaining_time": "0:14:16", "throughput": 5683.67, "total_tokens": 17275808} {"current_steps": 26470, "total_steps": 33920, "loss": 0.3875, "lr": 1.3992287554558042e-06, "epoch": 15.607311320754716, "percentage": 78.04, "elapsed_time": "0:50:40", "remaining_time": "0:14:15", "throughput": 5683.78, "total_tokens": 17279424} {"current_steps": 26475, "total_steps": 33920, "loss": 0.268, "lr": 1.3974442471434885e-06, "epoch": 15.610259433962264, "percentage": 78.05, "elapsed_time": "0:50:40", "remaining_time": "0:14:15", "throughput": 5683.69, "total_tokens": 17282080} {"current_steps": 26480, "total_steps": 33920, "loss": 0.3232, "lr": 1.395660692623334e-06, "epoch": 15.61320754716981, "percentage": 78.07, "elapsed_time": "0:50:41", "remaining_time": "0:14:14", "throughput": 5683.57, "total_tokens": 17284608} {"current_steps": 26485, "total_steps": 33920, "loss": 0.312, "lr": 1.3938780923675454e-06, "epoch": 15.616155660377359, "percentage": 78.08, "elapsed_time": "0:50:41", "remaining_time": "0:14:13", "throughput": 5683.53, "total_tokens": 17287328} {"current_steps": 26490, "total_steps": 33920, "loss": 0.3907, "lr": 1.3920964468480718e-06, "epoch": 15.619103773584905, "percentage": 78.1, "elapsed_time": "0:50:42", "remaining_time": "0:14:13", "throughput": 5683.33, "total_tokens": 17289856} {"current_steps": 26495, "total_steps": 33920, "loss": 0.2877, "lr": 1.3903157565366143e-06, "epoch": 15.622051886792454, "percentage": 78.11, "elapsed_time": "0:50:42", "remaining_time": "0:14:12", "throughput": 5683.3, "total_tokens": 17292736} {"current_steps": 26500, "total_steps": 33920, "loss": 0.3608, "lr": 1.3885360219046172e-06, "epoch": 15.625, "percentage": 78.12, "elapsed_time": "0:50:43", "remaining_time": "0:14:12", "throughput": 5683.34, "total_tokens": 17295968} {"current_steps": 26505, "total_steps": 33920, "loss": 0.3303, "lr": 1.386757243423273e-06, "epoch": 15.627948113207546, "percentage": 78.14, "elapsed_time": "0:50:43", "remaining_time": "0:14:11", "throughput": 5683.05, "total_tokens": 17298144} {"current_steps": 26510, "total_steps": 33920, "loss": 0.3568, "lr": 1.384979421563521e-06, "epoch": 15.630896226415095, "percentage": 78.15, "elapsed_time": "0:50:44", "remaining_time": "0:14:10", "throughput": 5683.05, "total_tokens": 17301184} {"current_steps": 26515, "total_steps": 33920, "loss": 0.4353, "lr": 1.3832025567960465e-06, "epoch": 15.633844339622641, "percentage": 78.17, "elapsed_time": "0:50:44", "remaining_time": "0:14:10", "throughput": 5682.98, "total_tokens": 17303808} {"current_steps": 26520, "total_steps": 33920, "loss": 0.3105, "lr": 1.3814266495912815e-06, "epoch": 15.63679245283019, "percentage": 78.18, "elapsed_time": "0:50:45", "remaining_time": "0:14:09", "throughput": 5682.96, "total_tokens": 17306784} {"current_steps": 26525, "total_steps": 33920, "loss": 0.3354, "lr": 1.3796517004194078e-06, "epoch": 15.639740566037736, "percentage": 78.2, "elapsed_time": "0:50:45", "remaining_time": "0:14:09", "throughput": 5683.03, "total_tokens": 17310432} {"current_steps": 26530, "total_steps": 33920, "loss": 0.3413, "lr": 1.3778777097503476e-06, "epoch": 15.642688679245284, "percentage": 78.21, "elapsed_time": "0:50:46", "remaining_time": "0:14:08", "throughput": 5682.93, "total_tokens": 17313152} {"current_steps": 26535, "total_steps": 33920, "loss": 0.2968, "lr": 1.3761046780537757e-06, "epoch": 15.64563679245283, "percentage": 78.23, "elapsed_time": "0:50:47", "remaining_time": "0:14:08", "throughput": 5682.82, "total_tokens": 17315680} {"current_steps": 26540, "total_steps": 33920, "loss": 0.1888, "lr": 1.3743326057991086e-06, "epoch": 15.648584905660378, "percentage": 78.24, "elapsed_time": "0:50:47", "remaining_time": "0:14:07", "throughput": 5682.86, "total_tokens": 17318880} {"current_steps": 26545, "total_steps": 33920, "loss": 0.3633, "lr": 1.3725614934555093e-06, "epoch": 15.651533018867925, "percentage": 78.26, "elapsed_time": "0:50:48", "remaining_time": "0:14:06", "throughput": 5682.84, "total_tokens": 17321728} {"current_steps": 26550, "total_steps": 33920, "loss": 0.2854, "lr": 1.3707913414918882e-06, "epoch": 15.654481132075471, "percentage": 78.27, "elapsed_time": "0:50:48", "remaining_time": "0:14:06", "throughput": 5682.78, "total_tokens": 17324896} {"current_steps": 26555, "total_steps": 33920, "loss": 0.2834, "lr": 1.3690221503768996e-06, "epoch": 15.65742924528302, "percentage": 78.29, "elapsed_time": "0:50:49", "remaining_time": "0:14:05", "throughput": 5682.9, "total_tokens": 17328448} {"current_steps": 26560, "total_steps": 33920, "loss": 0.4084, "lr": 1.3672539205789465e-06, "epoch": 15.660377358490566, "percentage": 78.3, "elapsed_time": "0:50:49", "remaining_time": "0:14:05", "throughput": 5683.02, "total_tokens": 17332224} {"current_steps": 26565, "total_steps": 33920, "loss": 0.3564, "lr": 1.3654866525661737e-06, "epoch": 15.663325471698114, "percentage": 78.32, "elapsed_time": "0:50:50", "remaining_time": "0:14:04", "throughput": 5682.86, "total_tokens": 17334624} {"current_steps": 26570, "total_steps": 33920, "loss": 0.4208, "lr": 1.3637203468064741e-06, "epoch": 15.66627358490566, "percentage": 78.33, "elapsed_time": "0:50:51", "remaining_time": "0:14:04", "throughput": 5683.15, "total_tokens": 17339936} {"current_steps": 26575, "total_steps": 33920, "loss": 0.3612, "lr": 1.3619550037674838e-06, "epoch": 15.669221698113208, "percentage": 78.35, "elapsed_time": "0:50:51", "remaining_time": "0:14:03", "throughput": 5683.12, "total_tokens": 17342720} {"current_steps": 26580, "total_steps": 33920, "loss": 0.3434, "lr": 1.3601906239165857e-06, "epoch": 15.672169811320755, "percentage": 78.36, "elapsed_time": "0:50:52", "remaining_time": "0:14:02", "throughput": 5683.19, "total_tokens": 17346464} {"current_steps": 26585, "total_steps": 33920, "loss": 0.4204, "lr": 1.3584272077209048e-06, "epoch": 15.675117924528301, "percentage": 78.38, "elapsed_time": "0:50:52", "remaining_time": "0:14:02", "throughput": 5683.16, "total_tokens": 17349600} {"current_steps": 26590, "total_steps": 33920, "loss": 0.2809, "lr": 1.3566647556473168e-06, "epoch": 15.67806603773585, "percentage": 78.39, "elapsed_time": "0:50:53", "remaining_time": "0:14:01", "throughput": 5683.03, "total_tokens": 17352512} {"current_steps": 26595, "total_steps": 33920, "loss": 0.3846, "lr": 1.3549032681624363e-06, "epoch": 15.681014150943396, "percentage": 78.41, "elapsed_time": "0:50:54", "remaining_time": "0:14:01", "throughput": 5683.26, "total_tokens": 17356896} {"current_steps": 26600, "total_steps": 33920, "loss": 0.2189, "lr": 1.3531427457326252e-06, "epoch": 15.683962264150944, "percentage": 78.42, "elapsed_time": "0:50:54", "remaining_time": "0:14:00", "throughput": 5683.31, "total_tokens": 17360160} {"current_steps": 26605, "total_steps": 33920, "loss": 0.3953, "lr": 1.3513831888239893e-06, "epoch": 15.68691037735849, "percentage": 78.43, "elapsed_time": "0:50:55", "remaining_time": "0:13:59", "throughput": 5683.42, "total_tokens": 17363488} {"current_steps": 26610, "total_steps": 33920, "loss": 0.2436, "lr": 1.3496245979023786e-06, "epoch": 15.689858490566039, "percentage": 78.45, "elapsed_time": "0:50:55", "remaining_time": "0:13:59", "throughput": 5683.52, "total_tokens": 17367296} {"current_steps": 26615, "total_steps": 33920, "loss": 0.3612, "lr": 1.3478669734333865e-06, "epoch": 15.692806603773585, "percentage": 78.46, "elapsed_time": "0:50:56", "remaining_time": "0:13:58", "throughput": 5683.67, "total_tokens": 17371008} {"current_steps": 26620, "total_steps": 33920, "loss": 0.3699, "lr": 1.3461103158823546e-06, "epoch": 15.695754716981131, "percentage": 78.48, "elapsed_time": "0:50:56", "remaining_time": "0:13:58", "throughput": 5683.78, "total_tokens": 17374304} {"current_steps": 26625, "total_steps": 33920, "loss": 0.2904, "lr": 1.3443546257143624e-06, "epoch": 15.69870283018868, "percentage": 78.49, "elapsed_time": "0:50:57", "remaining_time": "0:13:57", "throughput": 5683.81, "total_tokens": 17377344} {"current_steps": 26630, "total_steps": 33920, "loss": 0.3278, "lr": 1.3425999033942395e-06, "epoch": 15.701650943396226, "percentage": 78.51, "elapsed_time": "0:50:57", "remaining_time": "0:13:57", "throughput": 5683.79, "total_tokens": 17380032} {"current_steps": 26635, "total_steps": 33920, "loss": 0.3639, "lr": 1.3408461493865549e-06, "epoch": 15.704599056603774, "percentage": 78.52, "elapsed_time": "0:50:58", "remaining_time": "0:13:56", "throughput": 5683.64, "total_tokens": 17382336} {"current_steps": 26640, "total_steps": 33920, "loss": 0.4187, "lr": 1.339093364155622e-06, "epoch": 15.70754716981132, "percentage": 78.54, "elapsed_time": "0:50:58", "remaining_time": "0:13:55", "throughput": 5683.72, "total_tokens": 17385664} {"current_steps": 26645, "total_steps": 33920, "loss": 0.4071, "lr": 1.3373415481654988e-06, "epoch": 15.710495283018869, "percentage": 78.55, "elapsed_time": "0:50:59", "remaining_time": "0:13:55", "throughput": 5683.85, "total_tokens": 17389056} {"current_steps": 26650, "total_steps": 33920, "loss": 0.3444, "lr": 1.335590701879984e-06, "epoch": 15.713443396226415, "percentage": 78.57, "elapsed_time": "0:50:59", "remaining_time": "0:13:54", "throughput": 5683.86, "total_tokens": 17391936} {"current_steps": 26655, "total_steps": 33920, "loss": 0.2407, "lr": 1.3338408257626257e-06, "epoch": 15.716391509433961, "percentage": 78.58, "elapsed_time": "0:51:00", "remaining_time": "0:13:54", "throughput": 5684.1, "total_tokens": 17396832} {"current_steps": 26660, "total_steps": 33920, "loss": 0.2513, "lr": 1.3320919202767086e-06, "epoch": 15.71933962264151, "percentage": 78.6, "elapsed_time": "0:51:01", "remaining_time": "0:13:53", "throughput": 5683.97, "total_tokens": 17399232} {"current_steps": 26665, "total_steps": 33920, "loss": 0.3838, "lr": 1.3303439858852636e-06, "epoch": 15.722287735849056, "percentage": 78.61, "elapsed_time": "0:51:01", "remaining_time": "0:13:53", "throughput": 5684.09, "total_tokens": 17402624} {"current_steps": 26670, "total_steps": 33920, "loss": 0.3655, "lr": 1.3285970230510636e-06, "epoch": 15.725235849056604, "percentage": 78.63, "elapsed_time": "0:51:02", "remaining_time": "0:13:52", "throughput": 5684.07, "total_tokens": 17406016} {"current_steps": 26675, "total_steps": 33920, "loss": 0.3531, "lr": 1.3268510322366246e-06, "epoch": 15.72818396226415, "percentage": 78.64, "elapsed_time": "0:51:02", "remaining_time": "0:13:51", "throughput": 5684.09, "total_tokens": 17408928} {"current_steps": 26680, "total_steps": 33920, "loss": 0.2431, "lr": 1.3251060139042038e-06, "epoch": 15.731132075471699, "percentage": 78.66, "elapsed_time": "0:51:03", "remaining_time": "0:13:51", "throughput": 5684.18, "total_tokens": 17412096} {"current_steps": 26685, "total_steps": 33920, "loss": 0.3417, "lr": 1.3233619685158056e-06, "epoch": 15.734080188679245, "percentage": 78.67, "elapsed_time": "0:51:03", "remaining_time": "0:13:50", "throughput": 5684.16, "total_tokens": 17414816} {"current_steps": 26690, "total_steps": 33920, "loss": 0.3285, "lr": 1.3216188965331712e-06, "epoch": 15.737028301886792, "percentage": 78.69, "elapsed_time": "0:51:04", "remaining_time": "0:13:50", "throughput": 5684.12, "total_tokens": 17417376} {"current_steps": 26695, "total_steps": 33920, "loss": 0.3344, "lr": 1.3198767984177869e-06, "epoch": 15.73997641509434, "percentage": 78.7, "elapsed_time": "0:51:04", "remaining_time": "0:13:49", "throughput": 5684.18, "total_tokens": 17420384} {"current_steps": 26700, "total_steps": 33920, "loss": 0.3501, "lr": 1.3181356746308805e-06, "epoch": 15.742924528301886, "percentage": 78.71, "elapsed_time": "0:51:05", "remaining_time": "0:13:48", "throughput": 5684.31, "total_tokens": 17423840} {"current_steps": 26705, "total_steps": 33920, "loss": 0.2717, "lr": 1.3163955256334226e-06, "epoch": 15.745872641509434, "percentage": 78.73, "elapsed_time": "0:51:05", "remaining_time": "0:13:48", "throughput": 5684.29, "total_tokens": 17426784} {"current_steps": 26710, "total_steps": 33920, "loss": 0.3016, "lr": 1.3146563518861227e-06, "epoch": 15.74882075471698, "percentage": 78.74, "elapsed_time": "0:51:06", "remaining_time": "0:13:47", "throughput": 5684.4, "total_tokens": 17430080} {"current_steps": 26715, "total_steps": 33920, "loss": 0.2567, "lr": 1.3129181538494384e-06, "epoch": 15.751768867924529, "percentage": 78.76, "elapsed_time": "0:51:06", "remaining_time": "0:13:47", "throughput": 5684.4, "total_tokens": 17432768} {"current_steps": 26720, "total_steps": 33920, "loss": 0.3205, "lr": 1.3111809319835622e-06, "epoch": 15.754716981132075, "percentage": 78.77, "elapsed_time": "0:51:07", "remaining_time": "0:13:46", "throughput": 5684.64, "total_tokens": 17437504} {"current_steps": 26725, "total_steps": 33920, "loss": 0.3815, "lr": 1.3094446867484335e-06, "epoch": 15.757665094339622, "percentage": 78.79, "elapsed_time": "0:51:07", "remaining_time": "0:13:45", "throughput": 5684.7, "total_tokens": 17440448} {"current_steps": 26730, "total_steps": 33920, "loss": 0.4823, "lr": 1.3077094186037287e-06, "epoch": 15.76061320754717, "percentage": 78.8, "elapsed_time": "0:51:08", "remaining_time": "0:13:45", "throughput": 5684.74, "total_tokens": 17443392} {"current_steps": 26735, "total_steps": 33920, "loss": 0.4009, "lr": 1.305975128008869e-06, "epoch": 15.763561320754716, "percentage": 78.82, "elapsed_time": "0:51:08", "remaining_time": "0:13:44", "throughput": 5684.64, "total_tokens": 17445824} {"current_steps": 26740, "total_steps": 33920, "loss": 0.3692, "lr": 1.304241815423014e-06, "epoch": 15.766509433962264, "percentage": 78.83, "elapsed_time": "0:51:09", "remaining_time": "0:13:44", "throughput": 5684.64, "total_tokens": 17448800} {"current_steps": 26745, "total_steps": 33920, "loss": 0.3118, "lr": 1.3025094813050655e-06, "epoch": 15.76945754716981, "percentage": 78.85, "elapsed_time": "0:51:10", "remaining_time": "0:13:43", "throughput": 5684.64, "total_tokens": 17451872} {"current_steps": 26750, "total_steps": 33920, "loss": 0.35, "lr": 1.3007781261136675e-06, "epoch": 15.772405660377359, "percentage": 78.86, "elapsed_time": "0:51:10", "remaining_time": "0:13:43", "throughput": 5684.72, "total_tokens": 17455584} {"current_steps": 26755, "total_steps": 33920, "loss": 0.3432, "lr": 1.299047750307204e-06, "epoch": 15.775353773584905, "percentage": 78.88, "elapsed_time": "0:51:11", "remaining_time": "0:13:42", "throughput": 5684.86, "total_tokens": 17459648} {"current_steps": 26760, "total_steps": 33920, "loss": 0.2918, "lr": 1.297318354343799e-06, "epoch": 15.778301886792454, "percentage": 78.89, "elapsed_time": "0:51:11", "remaining_time": "0:13:41", "throughput": 5684.79, "total_tokens": 17462528} {"current_steps": 26765, "total_steps": 33920, "loss": 0.3034, "lr": 1.295589938681317e-06, "epoch": 15.78125, "percentage": 78.91, "elapsed_time": "0:51:12", "remaining_time": "0:13:41", "throughput": 5684.91, "total_tokens": 17466592} {"current_steps": 26770, "total_steps": 33920, "loss": 0.3418, "lr": 1.2938625037773628e-06, "epoch": 15.784198113207546, "percentage": 78.92, "elapsed_time": "0:51:13", "remaining_time": "0:13:40", "throughput": 5685.05, "total_tokens": 17470240} {"current_steps": 26775, "total_steps": 33920, "loss": 0.2628, "lr": 1.2921360500892843e-06, "epoch": 15.787146226415095, "percentage": 78.94, "elapsed_time": "0:51:13", "remaining_time": "0:13:40", "throughput": 5685.19, "total_tokens": 17474080} {"current_steps": 26780, "total_steps": 33920, "loss": 0.3553, "lr": 1.290410578074167e-06, "epoch": 15.790094339622641, "percentage": 78.95, "elapsed_time": "0:51:14", "remaining_time": "0:13:39", "throughput": 5685.17, "total_tokens": 17476928} {"current_steps": 26785, "total_steps": 33920, "loss": 0.3007, "lr": 1.2886860881888362e-06, "epoch": 15.79304245283019, "percentage": 78.97, "elapsed_time": "0:51:14", "remaining_time": "0:13:39", "throughput": 5685.17, "total_tokens": 17480256} {"current_steps": 26790, "total_steps": 33920, "loss": 0.2926, "lr": 1.2869625808898584e-06, "epoch": 15.795990566037736, "percentage": 78.98, "elapsed_time": "0:51:15", "remaining_time": "0:13:38", "throughput": 5685.15, "total_tokens": 17483168} {"current_steps": 26795, "total_steps": 33920, "loss": 0.5848, "lr": 1.2852400566335398e-06, "epoch": 15.798938679245284, "percentage": 78.99, "elapsed_time": "0:51:15", "remaining_time": "0:13:37", "throughput": 5685.21, "total_tokens": 17487360} {"current_steps": 26800, "total_steps": 33920, "loss": 0.3643, "lr": 1.2835185158759244e-06, "epoch": 15.80188679245283, "percentage": 79.01, "elapsed_time": "0:51:16", "remaining_time": "0:13:37", "throughput": 5685.4, "total_tokens": 17491648} {"current_steps": 26805, "total_steps": 33920, "loss": 0.3023, "lr": 1.2817979590728009e-06, "epoch": 15.804834905660378, "percentage": 79.02, "elapsed_time": "0:51:17", "remaining_time": "0:13:36", "throughput": 5685.36, "total_tokens": 17494464} {"current_steps": 26810, "total_steps": 33920, "loss": 0.3423, "lr": 1.2800783866796918e-06, "epoch": 15.807783018867925, "percentage": 79.04, "elapsed_time": "0:51:17", "remaining_time": "0:13:36", "throughput": 5685.28, "total_tokens": 17497280} {"current_steps": 26815, "total_steps": 33920, "loss": 0.363, "lr": 1.2783597991518604e-06, "epoch": 15.810731132075471, "percentage": 79.05, "elapsed_time": "0:51:18", "remaining_time": "0:13:35", "throughput": 5685.39, "total_tokens": 17500704} {"current_steps": 26820, "total_steps": 33920, "loss": 0.3457, "lr": 1.2766421969443131e-06, "epoch": 15.81367924528302, "percentage": 79.07, "elapsed_time": "0:51:18", "remaining_time": "0:13:35", "throughput": 5685.48, "total_tokens": 17504192} {"current_steps": 26825, "total_steps": 33920, "loss": 0.2919, "lr": 1.274925580511791e-06, "epoch": 15.816627358490566, "percentage": 79.08, "elapsed_time": "0:51:19", "remaining_time": "0:13:34", "throughput": 5685.59, "total_tokens": 17507808} {"current_steps": 26830, "total_steps": 33920, "loss": 0.1826, "lr": 1.2732099503087757e-06, "epoch": 15.819575471698114, "percentage": 79.1, "elapsed_time": "0:51:19", "remaining_time": "0:13:33", "throughput": 5685.68, "total_tokens": 17511488} {"current_steps": 26835, "total_steps": 33920, "loss": 0.2992, "lr": 1.2714953067894859e-06, "epoch": 15.82252358490566, "percentage": 79.11, "elapsed_time": "0:51:20", "remaining_time": "0:13:33", "throughput": 5685.63, "total_tokens": 17514240} {"current_steps": 26840, "total_steps": 33920, "loss": 0.2914, "lr": 1.2697816504078847e-06, "epoch": 15.825471698113208, "percentage": 79.13, "elapsed_time": "0:51:20", "remaining_time": "0:13:32", "throughput": 5685.57, "total_tokens": 17517024} {"current_steps": 26845, "total_steps": 33920, "loss": 0.4058, "lr": 1.2680689816176672e-06, "epoch": 15.828419811320755, "percentage": 79.14, "elapsed_time": "0:51:21", "remaining_time": "0:13:32", "throughput": 5685.43, "total_tokens": 17519616} {"current_steps": 26850, "total_steps": 33920, "loss": 0.3124, "lr": 1.2663573008722707e-06, "epoch": 15.831367924528301, "percentage": 79.16, "elapsed_time": "0:51:22", "remaining_time": "0:13:31", "throughput": 5685.46, "total_tokens": 17523072} {"current_steps": 26855, "total_steps": 33920, "loss": 0.2789, "lr": 1.2646466086248698e-06, "epoch": 15.83431603773585, "percentage": 79.17, "elapsed_time": "0:51:22", "remaining_time": "0:13:30", "throughput": 5685.33, "total_tokens": 17525568} {"current_steps": 26860, "total_steps": 33920, "loss": 0.3958, "lr": 1.2629369053283779e-06, "epoch": 15.837264150943396, "percentage": 79.19, "elapsed_time": "0:51:23", "remaining_time": "0:13:30", "throughput": 5685.36, "total_tokens": 17528480} {"current_steps": 26865, "total_steps": 33920, "loss": 0.2362, "lr": 1.2612281914354452e-06, "epoch": 15.840212264150944, "percentage": 79.2, "elapsed_time": "0:51:23", "remaining_time": "0:13:29", "throughput": 5685.29, "total_tokens": 17531168} {"current_steps": 26870, "total_steps": 33920, "loss": 0.3053, "lr": 1.259520467398463e-06, "epoch": 15.84316037735849, "percentage": 79.22, "elapsed_time": "0:51:24", "remaining_time": "0:13:29", "throughput": 5685.34, "total_tokens": 17534560} {"current_steps": 26875, "total_steps": 33920, "loss": 0.2452, "lr": 1.2578137336695573e-06, "epoch": 15.846108490566039, "percentage": 79.23, "elapsed_time": "0:51:24", "remaining_time": "0:13:28", "throughput": 5685.32, "total_tokens": 17537280} {"current_steps": 26880, "total_steps": 33920, "loss": 0.3069, "lr": 1.256107990700594e-06, "epoch": 15.849056603773585, "percentage": 79.25, "elapsed_time": "0:51:25", "remaining_time": "0:13:28", "throughput": 5685.26, "total_tokens": 17540320} {"current_steps": 26885, "total_steps": 33920, "loss": 0.3686, "lr": 1.2544032389431753e-06, "epoch": 15.852004716981131, "percentage": 79.26, "elapsed_time": "0:51:25", "remaining_time": "0:13:27", "throughput": 5685.25, "total_tokens": 17543264} {"current_steps": 26890, "total_steps": 33920, "loss": 0.245, "lr": 1.2526994788486418e-06, "epoch": 15.85495283018868, "percentage": 79.27, "elapsed_time": "0:51:26", "remaining_time": "0:13:26", "throughput": 5685.25, "total_tokens": 17546176} {"current_steps": 26895, "total_steps": 33920, "loss": 0.3591, "lr": 1.2509967108680697e-06, "epoch": 15.857900943396226, "percentage": 79.29, "elapsed_time": "0:51:26", "remaining_time": "0:13:26", "throughput": 5685.25, "total_tokens": 17549344} {"current_steps": 26900, "total_steps": 33920, "loss": 0.3506, "lr": 1.249294935452277e-06, "epoch": 15.860849056603774, "percentage": 79.3, "elapsed_time": "0:51:27", "remaining_time": "0:13:25", "throughput": 5685.48, "total_tokens": 17553984} {"current_steps": 26905, "total_steps": 33920, "loss": 0.1985, "lr": 1.247594153051815e-06, "epoch": 15.86379716981132, "percentage": 79.32, "elapsed_time": "0:51:28", "remaining_time": "0:13:25", "throughput": 5685.81, "total_tokens": 17560768} {"current_steps": 26910, "total_steps": 33920, "loss": 0.3016, "lr": 1.2458943641169718e-06, "epoch": 15.866745283018869, "percentage": 79.33, "elapsed_time": "0:51:29", "remaining_time": "0:13:24", "throughput": 5685.84, "total_tokens": 17563744} {"current_steps": 26915, "total_steps": 33920, "loss": 0.2823, "lr": 1.2441955690977758e-06, "epoch": 15.869693396226415, "percentage": 79.35, "elapsed_time": "0:51:29", "remaining_time": "0:13:24", "throughput": 5685.94, "total_tokens": 17567168} {"current_steps": 26920, "total_steps": 33920, "loss": 0.3532, "lr": 1.2424977684439898e-06, "epoch": 15.872641509433961, "percentage": 79.36, "elapsed_time": "0:51:30", "remaining_time": "0:13:23", "throughput": 5685.92, "total_tokens": 17570528} {"current_steps": 26925, "total_steps": 33920, "loss": 0.3773, "lr": 1.2408009626051137e-06, "epoch": 15.87558962264151, "percentage": 79.38, "elapsed_time": "0:51:30", "remaining_time": "0:13:22", "throughput": 5685.9, "total_tokens": 17573440} {"current_steps": 26930, "total_steps": 33920, "loss": 0.2489, "lr": 1.2391051520303826e-06, "epoch": 15.878537735849056, "percentage": 79.39, "elapsed_time": "0:51:31", "remaining_time": "0:13:22", "throughput": 5685.99, "total_tokens": 17576736} {"current_steps": 26935, "total_steps": 33920, "loss": 0.4045, "lr": 1.2374103371687723e-06, "epoch": 15.881485849056604, "percentage": 79.41, "elapsed_time": "0:51:31", "remaining_time": "0:13:21", "throughput": 5686.02, "total_tokens": 17579936} {"current_steps": 26940, "total_steps": 33920, "loss": 0.2868, "lr": 1.2357165184689906e-06, "epoch": 15.88443396226415, "percentage": 79.42, "elapsed_time": "0:51:32", "remaining_time": "0:13:21", "throughput": 5686.1, "total_tokens": 17583200} {"current_steps": 26945, "total_steps": 33920, "loss": 0.2296, "lr": 1.2340236963794845e-06, "epoch": 15.887382075471699, "percentage": 79.44, "elapsed_time": "0:51:32", "remaining_time": "0:13:20", "throughput": 5686.09, "total_tokens": 17586144} {"current_steps": 26950, "total_steps": 33920, "loss": 0.3663, "lr": 1.232331871348435e-06, "epoch": 15.890330188679245, "percentage": 79.45, "elapsed_time": "0:51:33", "remaining_time": "0:13:20", "throughput": 5686.07, "total_tokens": 17588992} {"current_steps": 26955, "total_steps": 33920, "loss": 0.388, "lr": 1.2306410438237603e-06, "epoch": 15.893278301886792, "percentage": 79.47, "elapsed_time": "0:51:33", "remaining_time": "0:13:19", "throughput": 5686.03, "total_tokens": 17591744} {"current_steps": 26960, "total_steps": 33920, "loss": 0.3444, "lr": 1.228951214253113e-06, "epoch": 15.89622641509434, "percentage": 79.48, "elapsed_time": "0:51:34", "remaining_time": "0:13:18", "throughput": 5686.2, "total_tokens": 17595616} {"current_steps": 26965, "total_steps": 33920, "loss": 0.3375, "lr": 1.2272623830838854e-06, "epoch": 15.899174528301886, "percentage": 79.5, "elapsed_time": "0:51:34", "remaining_time": "0:13:18", "throughput": 5686.3, "total_tokens": 17598880} {"current_steps": 26970, "total_steps": 33920, "loss": 0.2687, "lr": 1.2255745507632016e-06, "epoch": 15.902122641509434, "percentage": 79.51, "elapsed_time": "0:51:35", "remaining_time": "0:13:17", "throughput": 5686.28, "total_tokens": 17602240} {"current_steps": 26975, "total_steps": 33920, "loss": 0.2864, "lr": 1.223887717737922e-06, "epoch": 15.90507075471698, "percentage": 79.53, "elapsed_time": "0:51:36", "remaining_time": "0:13:17", "throughput": 5686.23, "total_tokens": 17605824} {"current_steps": 26980, "total_steps": 33920, "loss": 0.245, "lr": 1.2222018844546434e-06, "epoch": 15.908018867924529, "percentage": 79.54, "elapsed_time": "0:51:36", "remaining_time": "0:13:16", "throughput": 5686.27, "total_tokens": 17609248} {"current_steps": 26985, "total_steps": 33920, "loss": 0.3283, "lr": 1.2205170513596975e-06, "epoch": 15.910966981132075, "percentage": 79.55, "elapsed_time": "0:51:37", "remaining_time": "0:13:15", "throughput": 5686.38, "total_tokens": 17612640} {"current_steps": 26990, "total_steps": 33920, "loss": 0.2401, "lr": 1.2188332188991493e-06, "epoch": 15.913915094339622, "percentage": 79.57, "elapsed_time": "0:51:37", "remaining_time": "0:13:15", "throughput": 5686.29, "total_tokens": 17615680} {"current_steps": 26995, "total_steps": 33920, "loss": 0.3587, "lr": 1.217150387518804e-06, "epoch": 15.91686320754717, "percentage": 79.58, "elapsed_time": "0:51:38", "remaining_time": "0:13:14", "throughput": 5686.3, "total_tokens": 17618656} {"current_steps": 27000, "total_steps": 33920, "loss": 0.4361, "lr": 1.2154685576641967e-06, "epoch": 15.919811320754716, "percentage": 79.6, "elapsed_time": "0:51:38", "remaining_time": "0:13:14", "throughput": 5686.18, "total_tokens": 17621344} {"current_steps": 27005, "total_steps": 33920, "loss": 0.2664, "lr": 1.2137877297805972e-06, "epoch": 15.922759433962264, "percentage": 79.61, "elapsed_time": "0:51:39", "remaining_time": "0:13:13", "throughput": 5686.16, "total_tokens": 17625088} {"current_steps": 27010, "total_steps": 33920, "loss": 0.3389, "lr": 1.2121079043130162e-06, "epoch": 15.92570754716981, "percentage": 79.63, "elapsed_time": "0:51:40", "remaining_time": "0:13:13", "throughput": 5686.4, "total_tokens": 17632320} {"current_steps": 27015, "total_steps": 33920, "loss": 0.3491, "lr": 1.210429081706192e-06, "epoch": 15.928655660377359, "percentage": 79.64, "elapsed_time": "0:51:41", "remaining_time": "0:13:12", "throughput": 5686.35, "total_tokens": 17635072} {"current_steps": 27020, "total_steps": 33920, "loss": 0.4026, "lr": 1.2087512624046005e-06, "epoch": 15.931603773584905, "percentage": 79.66, "elapsed_time": "0:51:41", "remaining_time": "0:13:12", "throughput": 5686.38, "total_tokens": 17638304} {"current_steps": 27025, "total_steps": 33920, "loss": 0.3374, "lr": 1.2070744468524503e-06, "epoch": 15.934551886792454, "percentage": 79.67, "elapsed_time": "0:51:42", "remaining_time": "0:13:11", "throughput": 5686.36, "total_tokens": 17641216} {"current_steps": 27030, "total_steps": 33920, "loss": 0.2618, "lr": 1.2053986354936887e-06, "epoch": 15.9375, "percentage": 79.69, "elapsed_time": "0:51:42", "remaining_time": "0:13:10", "throughput": 5686.43, "total_tokens": 17644576} {"current_steps": 27035, "total_steps": 33920, "loss": 0.283, "lr": 1.2037238287719916e-06, "epoch": 15.940448113207546, "percentage": 79.7, "elapsed_time": "0:51:43", "remaining_time": "0:13:10", "throughput": 5686.42, "total_tokens": 17647648} {"current_steps": 27040, "total_steps": 33920, "loss": 0.3916, "lr": 1.2020500271307721e-06, "epoch": 15.943396226415095, "percentage": 79.72, "elapsed_time": "0:51:44", "remaining_time": "0:13:09", "throughput": 5686.46, "total_tokens": 17651040} {"current_steps": 27045, "total_steps": 33920, "loss": 0.4676, "lr": 1.200377231013176e-06, "epoch": 15.946344339622641, "percentage": 79.73, "elapsed_time": "0:51:44", "remaining_time": "0:13:09", "throughput": 5686.41, "total_tokens": 17653728} {"current_steps": 27050, "total_steps": 33920, "loss": 0.4361, "lr": 1.1987054408620825e-06, "epoch": 15.94929245283019, "percentage": 79.75, "elapsed_time": "0:51:45", "remaining_time": "0:13:08", "throughput": 5686.24, "total_tokens": 17656352} {"current_steps": 27055, "total_steps": 33920, "loss": 0.3539, "lr": 1.197034657120107e-06, "epoch": 15.952240566037736, "percentage": 79.76, "elapsed_time": "0:51:46", "remaining_time": "0:13:08", "throughput": 5686.45, "total_tokens": 17662432} {"current_steps": 27060, "total_steps": 33920, "loss": 0.2473, "lr": 1.1953648802295964e-06, "epoch": 15.955188679245284, "percentage": 79.78, "elapsed_time": "0:51:46", "remaining_time": "0:13:07", "throughput": 5686.55, "total_tokens": 17665888} {"current_steps": 27065, "total_steps": 33920, "loss": 0.278, "lr": 1.1936961106326307e-06, "epoch": 15.95813679245283, "percentage": 79.79, "elapsed_time": "0:51:47", "remaining_time": "0:13:06", "throughput": 5686.57, "total_tokens": 17669056} {"current_steps": 27070, "total_steps": 33920, "loss": 0.256, "lr": 1.1920283487710237e-06, "epoch": 15.961084905660378, "percentage": 79.81, "elapsed_time": "0:51:47", "remaining_time": "0:13:06", "throughput": 5686.3, "total_tokens": 17671200} {"current_steps": 27075, "total_steps": 33920, "loss": 0.2659, "lr": 1.1903615950863228e-06, "epoch": 15.964033018867925, "percentage": 79.82, "elapsed_time": "0:51:48", "remaining_time": "0:13:05", "throughput": 5686.23, "total_tokens": 17673856} {"current_steps": 27080, "total_steps": 33920, "loss": 0.3612, "lr": 1.1886958500198076e-06, "epoch": 15.966981132075471, "percentage": 79.83, "elapsed_time": "0:51:48", "remaining_time": "0:13:05", "throughput": 5686.33, "total_tokens": 17677280} {"current_steps": 27085, "total_steps": 33920, "loss": 0.3786, "lr": 1.1870311140124923e-06, "epoch": 15.96992924528302, "percentage": 79.85, "elapsed_time": "0:51:49", "remaining_time": "0:13:04", "throughput": 5686.39, "total_tokens": 17680800} {"current_steps": 27090, "total_steps": 33920, "loss": 0.3165, "lr": 1.185367387505123e-06, "epoch": 15.972877358490566, "percentage": 79.86, "elapsed_time": "0:51:49", "remaining_time": "0:13:04", "throughput": 5686.33, "total_tokens": 17683520} {"current_steps": 27095, "total_steps": 33920, "loss": 0.6599, "lr": 1.1837046709381783e-06, "epoch": 15.975825471698114, "percentage": 79.88, "elapsed_time": "0:51:50", "remaining_time": "0:13:03", "throughput": 5686.24, "total_tokens": 17686272} {"current_steps": 27100, "total_steps": 33920, "loss": 0.2871, "lr": 1.1820429647518678e-06, "epoch": 15.97877358490566, "percentage": 79.89, "elapsed_time": "0:51:50", "remaining_time": "0:13:02", "throughput": 5686.32, "total_tokens": 17689952} {"current_steps": 27105, "total_steps": 33920, "loss": 0.3556, "lr": 1.1803822693861377e-06, "epoch": 15.981721698113208, "percentage": 79.91, "elapsed_time": "0:51:51", "remaining_time": "0:13:02", "throughput": 5686.18, "total_tokens": 17692672} {"current_steps": 27110, "total_steps": 33920, "loss": 0.2598, "lr": 1.1787225852806639e-06, "epoch": 15.984669811320755, "percentage": 79.92, "elapsed_time": "0:51:52", "remaining_time": "0:13:01", "throughput": 5686.1, "total_tokens": 17695712} {"current_steps": 27115, "total_steps": 33920, "loss": 0.3386, "lr": 1.177063912874853e-06, "epoch": 15.987617924528301, "percentage": 79.94, "elapsed_time": "0:51:52", "remaining_time": "0:13:01", "throughput": 5685.98, "total_tokens": 17698400} {"current_steps": 27120, "total_steps": 33920, "loss": 0.537, "lr": 1.1754062526078487e-06, "epoch": 15.99056603773585, "percentage": 79.95, "elapsed_time": "0:51:53", "remaining_time": "0:13:00", "throughput": 5686.01, "total_tokens": 17701856} {"current_steps": 27125, "total_steps": 33920, "loss": 0.3308, "lr": 1.1737496049185215e-06, "epoch": 15.993514150943396, "percentage": 79.97, "elapsed_time": "0:51:53", "remaining_time": "0:13:00", "throughput": 5685.96, "total_tokens": 17704864} {"current_steps": 27130, "total_steps": 33920, "loss": 0.3565, "lr": 1.172093970245477e-06, "epoch": 15.996462264150944, "percentage": 79.98, "elapsed_time": "0:51:54", "remaining_time": "0:12:59", "throughput": 5686.0, "total_tokens": 17708480} {"current_steps": 27135, "total_steps": 33920, "loss": 0.3286, "lr": 1.1704393490270516e-06, "epoch": 15.99941037735849, "percentage": 80.0, "elapsed_time": "0:51:54", "remaining_time": "0:12:58", "throughput": 5686.06, "total_tokens": 17712032} {"current_steps": 27136, "total_steps": 33920, "eval_loss": 0.6074872016906738, "epoch": 16.0, "percentage": 80.0, "elapsed_time": "0:52:14", "remaining_time": "0:13:03", "throughput": 5650.69, "total_tokens": 17712104} {"current_steps": 27140, "total_steps": 33920, "loss": 0.2119, "lr": 1.1687857417013126e-06, "epoch": 16.00235849056604, "percentage": 80.01, "elapsed_time": "0:52:18", "remaining_time": "0:13:04", "throughput": 5644.65, "total_tokens": 17715048} {"current_steps": 27145, "total_steps": 33920, "loss": 0.3081, "lr": 1.1671331487060583e-06, "epoch": 16.005306603773583, "percentage": 80.03, "elapsed_time": "0:52:18", "remaining_time": "0:13:03", "throughput": 5644.6, "total_tokens": 17717992} {"current_steps": 27150, "total_steps": 33920, "loss": 0.3316, "lr": 1.1654815704788237e-06, "epoch": 16.00825471698113, "percentage": 80.04, "elapsed_time": "0:52:19", "remaining_time": "0:13:02", "throughput": 5644.28, "total_tokens": 17720328} {"current_steps": 27155, "total_steps": 33920, "loss": 0.2589, "lr": 1.1638310074568687e-06, "epoch": 16.01120283018868, "percentage": 80.06, "elapsed_time": "0:52:20", "remaining_time": "0:13:02", "throughput": 5644.35, "total_tokens": 17723880} {"current_steps": 27160, "total_steps": 33920, "loss": 0.2891, "lr": 1.162181460077188e-06, "epoch": 16.014150943396228, "percentage": 80.07, "elapsed_time": "0:52:20", "remaining_time": "0:13:01", "throughput": 5644.49, "total_tokens": 17727944} {"current_steps": 27165, "total_steps": 33920, "loss": 0.2962, "lr": 1.1605329287765056e-06, "epoch": 16.017099056603772, "percentage": 80.09, "elapsed_time": "0:52:21", "remaining_time": "0:13:01", "throughput": 5644.67, "total_tokens": 17731848} {"current_steps": 27170, "total_steps": 33920, "loss": 0.2633, "lr": 1.1588854139912775e-06, "epoch": 16.02004716981132, "percentage": 80.1, "elapsed_time": "0:52:21", "remaining_time": "0:13:00", "throughput": 5644.51, "total_tokens": 17734536} {"current_steps": 27175, "total_steps": 33920, "loss": 0.2476, "lr": 1.1572389161576886e-06, "epoch": 16.02299528301887, "percentage": 80.11, "elapsed_time": "0:52:22", "remaining_time": "0:12:59", "throughput": 5644.66, "total_tokens": 17738312} {"current_steps": 27180, "total_steps": 33920, "loss": 0.4312, "lr": 1.15559343571166e-06, "epoch": 16.025943396226417, "percentage": 80.13, "elapsed_time": "0:52:23", "remaining_time": "0:12:59", "throughput": 5644.72, "total_tokens": 17741480} {"current_steps": 27185, "total_steps": 33920, "loss": 0.3601, "lr": 1.153948973088837e-06, "epoch": 16.02889150943396, "percentage": 80.14, "elapsed_time": "0:52:23", "remaining_time": "0:12:58", "throughput": 5644.63, "total_tokens": 17744520} {"current_steps": 27190, "total_steps": 33920, "loss": 0.2473, "lr": 1.1523055287245993e-06, "epoch": 16.03183962264151, "percentage": 80.16, "elapsed_time": "0:52:24", "remaining_time": "0:12:58", "throughput": 5644.53, "total_tokens": 17747080} {"current_steps": 27195, "total_steps": 33920, "loss": 0.3196, "lr": 1.150663103054056e-06, "epoch": 16.034787735849058, "percentage": 80.17, "elapsed_time": "0:52:24", "remaining_time": "0:12:57", "throughput": 5644.59, "total_tokens": 17750632} {"current_steps": 27200, "total_steps": 33920, "loss": 0.2132, "lr": 1.1490216965120438e-06, "epoch": 16.037735849056602, "percentage": 80.19, "elapsed_time": "0:52:25", "remaining_time": "0:12:57", "throughput": 5644.51, "total_tokens": 17753864} {"current_steps": 27205, "total_steps": 33920, "loss": 0.3224, "lr": 1.147381309533136e-06, "epoch": 16.04068396226415, "percentage": 80.2, "elapsed_time": "0:52:25", "remaining_time": "0:12:56", "throughput": 5644.44, "total_tokens": 17756744} {"current_steps": 27210, "total_steps": 33920, "loss": 0.2373, "lr": 1.1457419425516287e-06, "epoch": 16.0436320754717, "percentage": 80.22, "elapsed_time": "0:52:26", "remaining_time": "0:12:55", "throughput": 5644.38, "total_tokens": 17759720} {"current_steps": 27215, "total_steps": 33920, "loss": 0.3176, "lr": 1.1441035960015544e-06, "epoch": 16.046580188679247, "percentage": 80.23, "elapsed_time": "0:52:26", "remaining_time": "0:12:55", "throughput": 5644.38, "total_tokens": 17762792} {"current_steps": 27220, "total_steps": 33920, "loss": 0.2959, "lr": 1.1424662703166716e-06, "epoch": 16.04952830188679, "percentage": 80.25, "elapsed_time": "0:52:27", "remaining_time": "0:12:54", "throughput": 5644.4, "total_tokens": 17765960} {"current_steps": 27225, "total_steps": 33920, "loss": 0.4118, "lr": 1.1408299659304684e-06, "epoch": 16.05247641509434, "percentage": 80.26, "elapsed_time": "0:52:28", "remaining_time": "0:12:54", "throughput": 5644.48, "total_tokens": 17769160} {"current_steps": 27230, "total_steps": 33920, "loss": 0.2657, "lr": 1.1391946832761642e-06, "epoch": 16.055424528301888, "percentage": 80.28, "elapsed_time": "0:52:28", "remaining_time": "0:12:53", "throughput": 5644.55, "total_tokens": 17772424} {"current_steps": 27235, "total_steps": 33920, "loss": 0.2424, "lr": 1.137560422786706e-06, "epoch": 16.058372641509433, "percentage": 80.29, "elapsed_time": "0:52:29", "remaining_time": "0:12:52", "throughput": 5644.52, "total_tokens": 17775336} {"current_steps": 27240, "total_steps": 33920, "loss": 0.3095, "lr": 1.1359271848947712e-06, "epoch": 16.06132075471698, "percentage": 80.31, "elapsed_time": "0:52:29", "remaining_time": "0:12:52", "throughput": 5644.57, "total_tokens": 17778600} {"current_steps": 27245, "total_steps": 33920, "loss": 0.4226, "lr": 1.1342949700327688e-06, "epoch": 16.06426886792453, "percentage": 80.32, "elapsed_time": "0:52:30", "remaining_time": "0:12:51", "throughput": 5644.69, "total_tokens": 17782760} {"current_steps": 27250, "total_steps": 33920, "loss": 0.4028, "lr": 1.1326637786328332e-06, "epoch": 16.067216981132077, "percentage": 80.34, "elapsed_time": "0:52:31", "remaining_time": "0:12:51", "throughput": 5644.75, "total_tokens": 17786952} {"current_steps": 27255, "total_steps": 33920, "loss": 0.3196, "lr": 1.1310336111268293e-06, "epoch": 16.07016509433962, "percentage": 80.35, "elapsed_time": "0:52:31", "remaining_time": "0:12:50", "throughput": 5644.61, "total_tokens": 17789544} {"current_steps": 27260, "total_steps": 33920, "loss": 0.3191, "lr": 1.1294044679463517e-06, "epoch": 16.07311320754717, "percentage": 80.37, "elapsed_time": "0:52:32", "remaining_time": "0:12:50", "throughput": 5644.74, "total_tokens": 17793576} {"current_steps": 27265, "total_steps": 33920, "loss": 0.2853, "lr": 1.1277763495227207e-06, "epoch": 16.076061320754718, "percentage": 80.38, "elapsed_time": "0:52:32", "remaining_time": "0:12:49", "throughput": 5644.92, "total_tokens": 17797896} {"current_steps": 27270, "total_steps": 33920, "loss": 0.2075, "lr": 1.1261492562869913e-06, "epoch": 16.079009433962263, "percentage": 80.4, "elapsed_time": "0:52:33", "remaining_time": "0:12:48", "throughput": 5644.89, "total_tokens": 17800712} {"current_steps": 27275, "total_steps": 33920, "loss": 0.2727, "lr": 1.1245231886699415e-06, "epoch": 16.08195754716981, "percentage": 80.41, "elapsed_time": "0:52:33", "remaining_time": "0:12:48", "throughput": 5644.84, "total_tokens": 17803592} {"current_steps": 27280, "total_steps": 33920, "loss": 0.3031, "lr": 1.12289814710208e-06, "epoch": 16.08490566037736, "percentage": 80.42, "elapsed_time": "0:52:34", "remaining_time": "0:12:47", "throughput": 5644.94, "total_tokens": 17806920} {"current_steps": 27285, "total_steps": 33920, "loss": 0.3875, "lr": 1.1212741320136433e-06, "epoch": 16.087853773584907, "percentage": 80.44, "elapsed_time": "0:52:35", "remaining_time": "0:12:47", "throughput": 5644.95, "total_tokens": 17810728} {"current_steps": 27290, "total_steps": 33920, "loss": 0.3086, "lr": 1.1196511438345963e-06, "epoch": 16.090801886792452, "percentage": 80.45, "elapsed_time": "0:52:35", "remaining_time": "0:12:46", "throughput": 5644.98, "total_tokens": 17813928} {"current_steps": 27295, "total_steps": 33920, "loss": 0.2685, "lr": 1.118029182994631e-06, "epoch": 16.09375, "percentage": 80.47, "elapsed_time": "0:52:36", "remaining_time": "0:12:46", "throughput": 5645.07, "total_tokens": 17817128} {"current_steps": 27300, "total_steps": 33920, "loss": 0.3804, "lr": 1.1164082499231704e-06, "epoch": 16.096698113207548, "percentage": 80.48, "elapsed_time": "0:52:36", "remaining_time": "0:12:45", "throughput": 5645.23, "total_tokens": 17820968} {"current_steps": 27305, "total_steps": 33920, "loss": 0.266, "lr": 1.114788345049364e-06, "epoch": 16.099646226415093, "percentage": 80.5, "elapsed_time": "0:52:37", "remaining_time": "0:12:44", "throughput": 5645.27, "total_tokens": 17823944} {"current_steps": 27310, "total_steps": 33920, "loss": 0.4085, "lr": 1.1131694688020872e-06, "epoch": 16.10259433962264, "percentage": 80.51, "elapsed_time": "0:52:37", "remaining_time": "0:12:44", "throughput": 5645.25, "total_tokens": 17826824} {"current_steps": 27315, "total_steps": 33920, "loss": 0.3681, "lr": 1.1115516216099453e-06, "epoch": 16.10554245283019, "percentage": 80.53, "elapsed_time": "0:52:38", "remaining_time": "0:12:43", "throughput": 5645.26, "total_tokens": 17829800} {"current_steps": 27320, "total_steps": 33920, "loss": 0.3387, "lr": 1.1099348039012698e-06, "epoch": 16.108490566037737, "percentage": 80.54, "elapsed_time": "0:52:38", "remaining_time": "0:12:43", "throughput": 5645.19, "total_tokens": 17832744} {"current_steps": 27325, "total_steps": 33920, "loss": 0.3687, "lr": 1.1083190161041202e-06, "epoch": 16.111438679245282, "percentage": 80.56, "elapsed_time": "0:52:39", "remaining_time": "0:12:42", "throughput": 5645.01, "total_tokens": 17835240} {"current_steps": 27330, "total_steps": 33920, "loss": 0.2662, "lr": 1.1067042586462822e-06, "epoch": 16.11438679245283, "percentage": 80.57, "elapsed_time": "0:52:39", "remaining_time": "0:12:41", "throughput": 5645.02, "total_tokens": 17838024} {"current_steps": 27335, "total_steps": 33920, "loss": 0.4647, "lr": 1.1050905319552718e-06, "epoch": 16.11733490566038, "percentage": 80.59, "elapsed_time": "0:52:40", "remaining_time": "0:12:41", "throughput": 5645.08, "total_tokens": 17841032} {"current_steps": 27340, "total_steps": 33920, "loss": 0.2946, "lr": 1.1034778364583293e-06, "epoch": 16.120283018867923, "percentage": 80.6, "elapsed_time": "0:52:41", "remaining_time": "0:12:40", "throughput": 5645.15, "total_tokens": 17844968} {"current_steps": 27345, "total_steps": 33920, "loss": 0.3007, "lr": 1.1018661725824231e-06, "epoch": 16.12323113207547, "percentage": 80.62, "elapsed_time": "0:52:41", "remaining_time": "0:12:40", "throughput": 5645.04, "total_tokens": 17847464} {"current_steps": 27350, "total_steps": 33920, "loss": 0.3636, "lr": 1.100255540754247e-06, "epoch": 16.12617924528302, "percentage": 80.63, "elapsed_time": "0:52:42", "remaining_time": "0:12:39", "throughput": 5644.99, "total_tokens": 17850504} {"current_steps": 27355, "total_steps": 33920, "loss": 0.3576, "lr": 1.0986459414002244e-06, "epoch": 16.129127358490567, "percentage": 80.65, "elapsed_time": "0:52:42", "remaining_time": "0:12:39", "throughput": 5645.1, "total_tokens": 17854248} {"current_steps": 27360, "total_steps": 33920, "loss": 0.354, "lr": 1.0970373749465008e-06, "epoch": 16.132075471698112, "percentage": 80.66, "elapsed_time": "0:52:43", "remaining_time": "0:12:38", "throughput": 5645.26, "total_tokens": 17858600} {"current_steps": 27365, "total_steps": 33920, "loss": 0.4058, "lr": 1.095429841818954e-06, "epoch": 16.13502358490566, "percentage": 80.68, "elapsed_time": "0:52:44", "remaining_time": "0:12:37", "throughput": 5645.36, "total_tokens": 17861928} {"current_steps": 27370, "total_steps": 33920, "loss": 0.4544, "lr": 1.093823342443185e-06, "epoch": 16.13797169811321, "percentage": 80.69, "elapsed_time": "0:52:44", "remaining_time": "0:12:37", "throughput": 5645.27, "total_tokens": 17864584} {"current_steps": 27375, "total_steps": 33920, "loss": 0.3409, "lr": 1.0922178772445203e-06, "epoch": 16.140919811320753, "percentage": 80.7, "elapsed_time": "0:52:45", "remaining_time": "0:12:36", "throughput": 5645.3, "total_tokens": 17867784} {"current_steps": 27380, "total_steps": 33920, "loss": 0.3639, "lr": 1.0906134466480146e-06, "epoch": 16.1438679245283, "percentage": 80.72, "elapsed_time": "0:52:45", "remaining_time": "0:12:36", "throughput": 5645.44, "total_tokens": 17871560} {"current_steps": 27385, "total_steps": 33920, "loss": 0.354, "lr": 1.0890100510784473e-06, "epoch": 16.14681603773585, "percentage": 80.73, "elapsed_time": "0:52:46", "remaining_time": "0:12:35", "throughput": 5645.43, "total_tokens": 17874440} {"current_steps": 27390, "total_steps": 33920, "loss": 0.4718, "lr": 1.0874076909603227e-06, "epoch": 16.149764150943398, "percentage": 80.75, "elapsed_time": "0:52:47", "remaining_time": "0:12:35", "throughput": 5645.63, "total_tokens": 17880584} {"current_steps": 27395, "total_steps": 33920, "loss": 0.3215, "lr": 1.0858063667178747e-06, "epoch": 16.152712264150942, "percentage": 80.76, "elapsed_time": "0:52:47", "remaining_time": "0:12:34", "throughput": 5645.81, "total_tokens": 17884360} {"current_steps": 27400, "total_steps": 33920, "loss": 0.4204, "lr": 1.0842060787750614e-06, "epoch": 16.15566037735849, "percentage": 80.78, "elapsed_time": "0:52:48", "remaining_time": "0:12:33", "throughput": 5645.82, "total_tokens": 17887272} {"current_steps": 27405, "total_steps": 33920, "loss": 0.2962, "lr": 1.0826068275555652e-06, "epoch": 16.15860849056604, "percentage": 80.79, "elapsed_time": "0:52:48", "remaining_time": "0:12:33", "throughput": 5645.98, "total_tokens": 17890888} {"current_steps": 27410, "total_steps": 33920, "loss": 0.2733, "lr": 1.081008613482794e-06, "epoch": 16.161556603773583, "percentage": 80.81, "elapsed_time": "0:52:49", "remaining_time": "0:12:32", "throughput": 5646.1, "total_tokens": 17894440} {"current_steps": 27415, "total_steps": 33920, "loss": 0.2423, "lr": 1.079411436979883e-06, "epoch": 16.16450471698113, "percentage": 80.82, "elapsed_time": "0:52:49", "remaining_time": "0:12:32", "throughput": 5646.23, "total_tokens": 17898184} {"current_steps": 27420, "total_steps": 33920, "loss": 0.318, "lr": 1.0778152984696905e-06, "epoch": 16.16745283018868, "percentage": 80.84, "elapsed_time": "0:52:50", "remaining_time": "0:12:31", "throughput": 5646.35, "total_tokens": 17901576} {"current_steps": 27425, "total_steps": 33920, "loss": 0.2908, "lr": 1.0762201983747993e-06, "epoch": 16.170400943396228, "percentage": 80.85, "elapsed_time": "0:52:51", "remaining_time": "0:12:31", "throughput": 5646.53, "total_tokens": 17905640} {"current_steps": 27430, "total_steps": 33920, "loss": 0.2446, "lr": 1.0746261371175238e-06, "epoch": 16.173349056603772, "percentage": 80.87, "elapsed_time": "0:52:51", "remaining_time": "0:12:30", "throughput": 5646.61, "total_tokens": 17909224} {"current_steps": 27435, "total_steps": 33920, "loss": 0.2277, "lr": 1.0730331151198953e-06, "epoch": 16.17629716981132, "percentage": 80.88, "elapsed_time": "0:52:52", "remaining_time": "0:12:29", "throughput": 5646.64, "total_tokens": 17912232} {"current_steps": 27440, "total_steps": 33920, "loss": 0.287, "lr": 1.0714411328036733e-06, "epoch": 16.17924528301887, "percentage": 80.9, "elapsed_time": "0:52:52", "remaining_time": "0:12:29", "throughput": 5646.69, "total_tokens": 17915464} {"current_steps": 27445, "total_steps": 33920, "loss": 0.2722, "lr": 1.0698501905903435e-06, "epoch": 16.182193396226417, "percentage": 80.91, "elapsed_time": "0:52:53", "remaining_time": "0:12:28", "throughput": 5646.67, "total_tokens": 17918120} {"current_steps": 27450, "total_steps": 33920, "loss": 0.3386, "lr": 1.0682602889011134e-06, "epoch": 16.18514150943396, "percentage": 80.93, "elapsed_time": "0:52:53", "remaining_time": "0:12:28", "throughput": 5646.77, "total_tokens": 17921704} {"current_steps": 27455, "total_steps": 33920, "loss": 0.225, "lr": 1.0666714281569152e-06, "epoch": 16.18808962264151, "percentage": 80.94, "elapsed_time": "0:52:54", "remaining_time": "0:12:27", "throughput": 5646.77, "total_tokens": 17924616} {"current_steps": 27460, "total_steps": 33920, "loss": 0.3371, "lr": 1.0650836087784095e-06, "epoch": 16.191037735849058, "percentage": 80.96, "elapsed_time": "0:52:54", "remaining_time": "0:12:26", "throughput": 5646.73, "total_tokens": 17927240} {"current_steps": 27465, "total_steps": 33920, "loss": 0.2921, "lr": 1.0634968311859768e-06, "epoch": 16.193985849056602, "percentage": 80.97, "elapsed_time": "0:52:55", "remaining_time": "0:12:26", "throughput": 5646.62, "total_tokens": 17929704} {"current_steps": 27470, "total_steps": 33920, "loss": 0.3896, "lr": 1.0619110957997237e-06, "epoch": 16.19693396226415, "percentage": 80.98, "elapsed_time": "0:52:55", "remaining_time": "0:12:25", "throughput": 5646.59, "total_tokens": 17932392} {"current_steps": 27475, "total_steps": 33920, "loss": 0.2726, "lr": 1.06032640303948e-06, "epoch": 16.1998820754717, "percentage": 81.0, "elapsed_time": "0:52:56", "remaining_time": "0:12:25", "throughput": 5646.67, "total_tokens": 17936264} {"current_steps": 27480, "total_steps": 33920, "loss": 0.4424, "lr": 1.0587427533248002e-06, "epoch": 16.202830188679247, "percentage": 81.01, "elapsed_time": "0:52:57", "remaining_time": "0:12:24", "throughput": 5646.75, "total_tokens": 17939848} {"current_steps": 27485, "total_steps": 33920, "loss": 0.2593, "lr": 1.057160147074961e-06, "epoch": 16.20577830188679, "percentage": 81.03, "elapsed_time": "0:52:57", "remaining_time": "0:12:23", "throughput": 5646.81, "total_tokens": 17943080} {"current_steps": 27490, "total_steps": 33920, "loss": 0.2887, "lr": 1.0555785847089657e-06, "epoch": 16.20872641509434, "percentage": 81.04, "elapsed_time": "0:52:58", "remaining_time": "0:12:23", "throughput": 5646.62, "total_tokens": 17945384} {"current_steps": 27495, "total_steps": 33920, "loss": 0.379, "lr": 1.0539980666455407e-06, "epoch": 16.211674528301888, "percentage": 81.06, "elapsed_time": "0:52:58", "remaining_time": "0:12:22", "throughput": 5646.67, "total_tokens": 17948488} {"current_steps": 27500, "total_steps": 33920, "loss": 0.3682, "lr": 1.052418593303134e-06, "epoch": 16.214622641509433, "percentage": 81.07, "elapsed_time": "0:52:59", "remaining_time": "0:12:22", "throughput": 5646.92, "total_tokens": 17953000} {"current_steps": 27505, "total_steps": 33920, "loss": 0.2317, "lr": 1.0508401650999178e-06, "epoch": 16.21757075471698, "percentage": 81.09, "elapsed_time": "0:52:59", "remaining_time": "0:12:21", "throughput": 5646.94, "total_tokens": 17956648} {"current_steps": 27510, "total_steps": 33920, "loss": 0.2588, "lr": 1.0492627824537877e-06, "epoch": 16.22051886792453, "percentage": 81.1, "elapsed_time": "0:53:00", "remaining_time": "0:12:21", "throughput": 5646.83, "total_tokens": 17959368} {"current_steps": 27515, "total_steps": 33920, "loss": 0.2621, "lr": 1.0476864457823626e-06, "epoch": 16.223466981132077, "percentage": 81.12, "elapsed_time": "0:53:01", "remaining_time": "0:12:20", "throughput": 5646.94, "total_tokens": 17963016} {"current_steps": 27520, "total_steps": 33920, "loss": 0.4282, "lr": 1.0461111555029836e-06, "epoch": 16.22641509433962, "percentage": 81.13, "elapsed_time": "0:53:01", "remaining_time": "0:12:19", "throughput": 5646.8, "total_tokens": 17965448} {"current_steps": 27525, "total_steps": 33920, "loss": 0.2906, "lr": 1.0445369120327175e-06, "epoch": 16.22936320754717, "percentage": 81.15, "elapsed_time": "0:53:02", "remaining_time": "0:12:19", "throughput": 5646.95, "total_tokens": 17969512} {"current_steps": 27530, "total_steps": 33920, "loss": 0.4581, "lr": 1.0429637157883516e-06, "epoch": 16.232311320754718, "percentage": 81.16, "elapsed_time": "0:53:02", "remaining_time": "0:12:18", "throughput": 5647.08, "total_tokens": 17973000} {"current_steps": 27535, "total_steps": 33920, "loss": 0.2866, "lr": 1.041391567186395e-06, "epoch": 16.235259433962263, "percentage": 81.18, "elapsed_time": "0:53:03", "remaining_time": "0:12:18", "throughput": 5647.14, "total_tokens": 17976232} {"current_steps": 27540, "total_steps": 33920, "loss": 0.2283, "lr": 1.0398204666430821e-06, "epoch": 16.23820754716981, "percentage": 81.19, "elapsed_time": "0:53:03", "remaining_time": "0:12:17", "throughput": 5647.03, "total_tokens": 17978728} {"current_steps": 27545, "total_steps": 33920, "loss": 0.229, "lr": 1.0382504145743667e-06, "epoch": 16.24115566037736, "percentage": 81.21, "elapsed_time": "0:53:04", "remaining_time": "0:12:16", "throughput": 5647.1, "total_tokens": 17982120} {"current_steps": 27550, "total_steps": 33920, "loss": 0.2887, "lr": 1.0366814113959294e-06, "epoch": 16.244103773584907, "percentage": 81.22, "elapsed_time": "0:53:04", "remaining_time": "0:12:16", "throughput": 5647.1, "total_tokens": 17985192} {"current_steps": 27555, "total_steps": 33920, "loss": 0.2458, "lr": 1.0351134575231697e-06, "epoch": 16.247051886792452, "percentage": 81.24, "elapsed_time": "0:53:05", "remaining_time": "0:12:15", "throughput": 5647.19, "total_tokens": 17988456} {"current_steps": 27560, "total_steps": 33920, "loss": 0.2224, "lr": 1.0335465533712098e-06, "epoch": 16.25, "percentage": 81.25, "elapsed_time": "0:53:05", "remaining_time": "0:12:15", "throughput": 5647.17, "total_tokens": 17991272} {"current_steps": 27565, "total_steps": 33920, "loss": 0.2824, "lr": 1.031980699354894e-06, "epoch": 16.252948113207548, "percentage": 81.26, "elapsed_time": "0:53:06", "remaining_time": "0:12:14", "throughput": 5647.29, "total_tokens": 17994792} {"current_steps": 27570, "total_steps": 33920, "loss": 0.2755, "lr": 1.03041589588879e-06, "epoch": 16.255896226415093, "percentage": 81.28, "elapsed_time": "0:53:06", "remaining_time": "0:12:14", "throughput": 5647.34, "total_tokens": 17997992} {"current_steps": 27575, "total_steps": 33920, "loss": 0.2818, "lr": 1.0288521433871834e-06, "epoch": 16.25884433962264, "percentage": 81.29, "elapsed_time": "0:53:07", "remaining_time": "0:12:13", "throughput": 5647.44, "total_tokens": 18001256} {"current_steps": 27580, "total_steps": 33920, "loss": 0.3305, "lr": 1.0272894422640866e-06, "epoch": 16.26179245283019, "percentage": 81.31, "elapsed_time": "0:53:08", "remaining_time": "0:12:12", "throughput": 5647.42, "total_tokens": 18004008} {"current_steps": 27585, "total_steps": 33920, "loss": 0.2132, "lr": 1.0257277929332332e-06, "epoch": 16.264740566037737, "percentage": 81.32, "elapsed_time": "0:53:08", "remaining_time": "0:12:12", "throughput": 5647.51, "total_tokens": 18007176} {"current_steps": 27590, "total_steps": 33920, "loss": 0.3307, "lr": 1.0241671958080745e-06, "epoch": 16.267688679245282, "percentage": 81.34, "elapsed_time": "0:53:09", "remaining_time": "0:12:11", "throughput": 5647.72, "total_tokens": 18011240} {"current_steps": 27595, "total_steps": 33920, "loss": 0.3755, "lr": 1.0226076513017858e-06, "epoch": 16.27063679245283, "percentage": 81.35, "elapsed_time": "0:53:09", "remaining_time": "0:12:11", "throughput": 5647.77, "total_tokens": 18014664} {"current_steps": 27600, "total_steps": 33920, "loss": 0.2907, "lr": 1.0210491598272625e-06, "epoch": 16.27358490566038, "percentage": 81.37, "elapsed_time": "0:53:10", "remaining_time": "0:12:10", "throughput": 5647.93, "total_tokens": 18018536} {"current_steps": 27605, "total_steps": 33920, "loss": 0.4067, "lr": 1.0194917217971229e-06, "epoch": 16.276533018867923, "percentage": 81.38, "elapsed_time": "0:53:10", "remaining_time": "0:12:09", "throughput": 5648.08, "total_tokens": 18022312} {"current_steps": 27610, "total_steps": 33920, "loss": 0.2838, "lr": 1.0179353376237038e-06, "epoch": 16.27948113207547, "percentage": 81.4, "elapsed_time": "0:53:11", "remaining_time": "0:12:09", "throughput": 5648.04, "total_tokens": 18024968} {"current_steps": 27615, "total_steps": 33920, "loss": 0.2966, "lr": 1.0163800077190672e-06, "epoch": 16.28242924528302, "percentage": 81.41, "elapsed_time": "0:53:11", "remaining_time": "0:12:08", "throughput": 5647.98, "total_tokens": 18028104} {"current_steps": 27620, "total_steps": 33920, "loss": 0.3349, "lr": 1.0148257324949916e-06, "epoch": 16.285377358490567, "percentage": 81.43, "elapsed_time": "0:53:12", "remaining_time": "0:12:08", "throughput": 5647.98, "total_tokens": 18031080} {"current_steps": 27625, "total_steps": 33920, "loss": 0.2549, "lr": 1.0132725123629783e-06, "epoch": 16.288325471698112, "percentage": 81.44, "elapsed_time": "0:53:13", "remaining_time": "0:12:07", "throughput": 5647.89, "total_tokens": 18033832} {"current_steps": 27630, "total_steps": 33920, "loss": 0.3281, "lr": 1.0117203477342497e-06, "epoch": 16.29127358490566, "percentage": 81.46, "elapsed_time": "0:53:13", "remaining_time": "0:12:07", "throughput": 5647.76, "total_tokens": 18036264} {"current_steps": 27635, "total_steps": 33920, "loss": 0.3533, "lr": 1.0101692390197477e-06, "epoch": 16.29422169811321, "percentage": 81.47, "elapsed_time": "0:53:14", "remaining_time": "0:12:06", "throughput": 5647.97, "total_tokens": 18040616} {"current_steps": 27640, "total_steps": 33920, "loss": 0.2777, "lr": 1.0086191866301331e-06, "epoch": 16.297169811320753, "percentage": 81.49, "elapsed_time": "0:53:14", "remaining_time": "0:12:05", "throughput": 5648.11, "total_tokens": 18044712} {"current_steps": 27645, "total_steps": 33920, "loss": 0.2246, "lr": 1.0070701909757918e-06, "epoch": 16.3001179245283, "percentage": 81.5, "elapsed_time": "0:53:15", "remaining_time": "0:12:05", "throughput": 5648.33, "total_tokens": 18049256} {"current_steps": 27650, "total_steps": 33920, "loss": 0.383, "lr": 1.0055222524668267e-06, "epoch": 16.30306603773585, "percentage": 81.52, "elapsed_time": "0:53:16", "remaining_time": "0:12:04", "throughput": 5648.45, "total_tokens": 18053032} {"current_steps": 27655, "total_steps": 33920, "loss": 0.3418, "lr": 1.00397537151306e-06, "epoch": 16.306014150943398, "percentage": 81.53, "elapsed_time": "0:53:16", "remaining_time": "0:12:04", "throughput": 5648.29, "total_tokens": 18055368} {"current_steps": 27660, "total_steps": 33920, "loss": 0.4552, "lr": 1.002429548524036e-06, "epoch": 16.308962264150942, "percentage": 81.54, "elapsed_time": "0:53:17", "remaining_time": "0:12:03", "throughput": 5648.28, "total_tokens": 18058856} {"current_steps": 27665, "total_steps": 33920, "loss": 0.2833, "lr": 1.0008847839090175e-06, "epoch": 16.31191037735849, "percentage": 81.56, "elapsed_time": "0:53:17", "remaining_time": "0:12:03", "throughput": 5648.38, "total_tokens": 18062280} {"current_steps": 27670, "total_steps": 33920, "loss": 0.294, "lr": 9.993410780769862e-07, "epoch": 16.31485849056604, "percentage": 81.57, "elapsed_time": "0:53:18", "remaining_time": "0:12:02", "throughput": 5648.43, "total_tokens": 18065288} {"current_steps": 27675, "total_steps": 33920, "loss": 0.3718, "lr": 9.977984314366463e-07, "epoch": 16.317806603773583, "percentage": 81.59, "elapsed_time": "0:53:18", "remaining_time": "0:12:01", "throughput": 5648.58, "total_tokens": 18069352} {"current_steps": 27680, "total_steps": 33920, "loss": 0.2307, "lr": 9.962568443964216e-07, "epoch": 16.32075471698113, "percentage": 81.6, "elapsed_time": "0:53:19", "remaining_time": "0:12:01", "throughput": 5648.74, "total_tokens": 18073224} {"current_steps": 27685, "total_steps": 33920, "loss": 0.4056, "lr": 9.947163173644524e-07, "epoch": 16.32370283018868, "percentage": 81.62, "elapsed_time": "0:53:19", "remaining_time": "0:12:00", "throughput": 5648.74, "total_tokens": 18075880} {"current_steps": 27690, "total_steps": 33920, "loss": 0.2761, "lr": 9.931768507486007e-07, "epoch": 16.326650943396228, "percentage": 81.63, "elapsed_time": "0:53:20", "remaining_time": "0:12:00", "throughput": 5648.7, "total_tokens": 18078792} {"current_steps": 27695, "total_steps": 33920, "loss": 0.3088, "lr": 9.916384449564453e-07, "epoch": 16.329599056603772, "percentage": 81.65, "elapsed_time": "0:53:21", "remaining_time": "0:11:59", "throughput": 5648.78, "total_tokens": 18082248} {"current_steps": 27700, "total_steps": 33920, "loss": 0.2517, "lr": 9.90101100395287e-07, "epoch": 16.33254716981132, "percentage": 81.66, "elapsed_time": "0:53:21", "remaining_time": "0:11:58", "throughput": 5648.85, "total_tokens": 18085384} {"current_steps": 27705, "total_steps": 33920, "loss": 0.332, "lr": 9.885648174721428e-07, "epoch": 16.33549528301887, "percentage": 81.68, "elapsed_time": "0:53:22", "remaining_time": "0:11:58", "throughput": 5648.95, "total_tokens": 18088616} {"current_steps": 27710, "total_steps": 33920, "loss": 0.2902, "lr": 9.870295965937532e-07, "epoch": 16.338443396226417, "percentage": 81.69, "elapsed_time": "0:53:22", "remaining_time": "0:11:57", "throughput": 5649.18, "total_tokens": 18092808} {"current_steps": 27715, "total_steps": 33920, "loss": 0.396, "lr": 9.854954381665727e-07, "epoch": 16.34139150943396, "percentage": 81.71, "elapsed_time": "0:53:23", "remaining_time": "0:11:57", "throughput": 5649.2, "total_tokens": 18095656} {"current_steps": 27720, "total_steps": 33920, "loss": 0.2304, "lr": 9.83962342596776e-07, "epoch": 16.34433962264151, "percentage": 81.72, "elapsed_time": "0:53:23", "remaining_time": "0:11:56", "throughput": 5649.14, "total_tokens": 18098120} {"current_steps": 27725, "total_steps": 33920, "loss": 0.2218, "lr": 9.824303102902576e-07, "epoch": 16.347287735849058, "percentage": 81.74, "elapsed_time": "0:53:24", "remaining_time": "0:11:55", "throughput": 5649.33, "total_tokens": 18101768} {"current_steps": 27730, "total_steps": 33920, "loss": 0.33, "lr": 9.808993416526292e-07, "epoch": 16.350235849056602, "percentage": 81.75, "elapsed_time": "0:53:24", "remaining_time": "0:11:55", "throughput": 5649.45, "total_tokens": 18105352} {"current_steps": 27735, "total_steps": 33920, "loss": 0.2587, "lr": 9.793694370892204e-07, "epoch": 16.35318396226415, "percentage": 81.77, "elapsed_time": "0:53:25", "remaining_time": "0:11:54", "throughput": 5649.68, "total_tokens": 18110600} {"current_steps": 27740, "total_steps": 33920, "loss": 0.2693, "lr": 9.77840597005082e-07, "epoch": 16.3561320754717, "percentage": 81.78, "elapsed_time": "0:53:26", "remaining_time": "0:11:54", "throughput": 5649.83, "total_tokens": 18114440} {"current_steps": 27745, "total_steps": 33920, "loss": 0.4437, "lr": 9.763128218049806e-07, "epoch": 16.359080188679247, "percentage": 81.8, "elapsed_time": "0:53:26", "remaining_time": "0:11:53", "throughput": 5649.84, "total_tokens": 18117352} {"current_steps": 27750, "total_steps": 33920, "loss": 0.3237, "lr": 9.747861118934005e-07, "epoch": 16.36202830188679, "percentage": 81.81, "elapsed_time": "0:53:27", "remaining_time": "0:11:53", "throughput": 5649.95, "total_tokens": 18120680} {"current_steps": 27755, "total_steps": 33920, "loss": 0.2719, "lr": 9.732604676745443e-07, "epoch": 16.36497641509434, "percentage": 81.82, "elapsed_time": "0:53:27", "remaining_time": "0:11:52", "throughput": 5649.91, "total_tokens": 18123240} {"current_steps": 27760, "total_steps": 33920, "loss": 0.3171, "lr": 9.717358895523333e-07, "epoch": 16.367924528301888, "percentage": 81.84, "elapsed_time": "0:53:28", "remaining_time": "0:11:51", "throughput": 5649.81, "total_tokens": 18125832} {"current_steps": 27765, "total_steps": 33920, "loss": 0.2841, "lr": 9.702123779304074e-07, "epoch": 16.370872641509433, "percentage": 81.85, "elapsed_time": "0:53:28", "remaining_time": "0:11:51", "throughput": 5649.85, "total_tokens": 18128872} {"current_steps": 27770, "total_steps": 33920, "loss": 0.2985, "lr": 9.686899332121203e-07, "epoch": 16.37382075471698, "percentage": 81.87, "elapsed_time": "0:53:29", "remaining_time": "0:11:50", "throughput": 5649.85, "total_tokens": 18131688} {"current_steps": 27775, "total_steps": 33920, "loss": 0.1736, "lr": 9.671685558005488e-07, "epoch": 16.37676886792453, "percentage": 81.88, "elapsed_time": "0:53:29", "remaining_time": "0:11:50", "throughput": 5649.96, "total_tokens": 18135304} {"current_steps": 27780, "total_steps": 33920, "loss": 0.2442, "lr": 9.656482460984828e-07, "epoch": 16.379716981132077, "percentage": 81.9, "elapsed_time": "0:53:30", "remaining_time": "0:11:49", "throughput": 5649.98, "total_tokens": 18138504} {"current_steps": 27785, "total_steps": 33920, "loss": 0.3456, "lr": 9.641290045084307e-07, "epoch": 16.38266509433962, "percentage": 81.91, "elapsed_time": "0:53:30", "remaining_time": "0:11:48", "throughput": 5650.12, "total_tokens": 18141864} {"current_steps": 27790, "total_steps": 33920, "loss": 0.2506, "lr": 9.626108314326182e-07, "epoch": 16.38561320754717, "percentage": 81.93, "elapsed_time": "0:53:31", "remaining_time": "0:11:48", "throughput": 5650.18, "total_tokens": 18144872} {"current_steps": 27795, "total_steps": 33920, "loss": 0.2807, "lr": 9.610937272729881e-07, "epoch": 16.388561320754718, "percentage": 81.94, "elapsed_time": "0:53:32", "remaining_time": "0:11:47", "throughput": 5650.42, "total_tokens": 18149448} {"current_steps": 27800, "total_steps": 33920, "loss": 0.4135, "lr": 9.595776924311996e-07, "epoch": 16.391509433962263, "percentage": 81.96, "elapsed_time": "0:53:32", "remaining_time": "0:11:47", "throughput": 5650.58, "total_tokens": 18152968} {"current_steps": 27805, "total_steps": 33920, "loss": 0.3678, "lr": 9.580627273086313e-07, "epoch": 16.39445754716981, "percentage": 81.97, "elapsed_time": "0:53:33", "remaining_time": "0:11:46", "throughput": 5650.63, "total_tokens": 18156264} {"current_steps": 27810, "total_steps": 33920, "loss": 0.2459, "lr": 9.565488323063754e-07, "epoch": 16.39740566037736, "percentage": 81.99, "elapsed_time": "0:53:33", "remaining_time": "0:11:46", "throughput": 5650.63, "total_tokens": 18159112} {"current_steps": 27815, "total_steps": 33920, "loss": 0.3786, "lr": 9.55036007825243e-07, "epoch": 16.400353773584907, "percentage": 82.0, "elapsed_time": "0:53:34", "remaining_time": "0:11:45", "throughput": 5650.53, "total_tokens": 18161800} {"current_steps": 27820, "total_steps": 33920, "loss": 0.3418, "lr": 9.535242542657602e-07, "epoch": 16.403301886792452, "percentage": 82.02, "elapsed_time": "0:53:34", "remaining_time": "0:11:44", "throughput": 5650.54, "total_tokens": 18164808} {"current_steps": 27825, "total_steps": 33920, "loss": 0.508, "lr": 9.520135720281692e-07, "epoch": 16.40625, "percentage": 82.03, "elapsed_time": "0:53:35", "remaining_time": "0:11:44", "throughput": 5650.63, "total_tokens": 18168072} {"current_steps": 27830, "total_steps": 33920, "loss": 0.2945, "lr": 9.505039615124318e-07, "epoch": 16.409198113207548, "percentage": 82.05, "elapsed_time": "0:53:35", "remaining_time": "0:11:43", "throughput": 5650.63, "total_tokens": 18171464} {"current_steps": 27835, "total_steps": 33920, "loss": 0.3909, "lr": 9.489954231182235e-07, "epoch": 16.412146226415093, "percentage": 82.06, "elapsed_time": "0:53:36", "remaining_time": "0:11:43", "throughput": 5650.61, "total_tokens": 18174824} {"current_steps": 27840, "total_steps": 33920, "loss": 0.309, "lr": 9.474879572449352e-07, "epoch": 16.41509433962264, "percentage": 82.08, "elapsed_time": "0:53:36", "remaining_time": "0:11:42", "throughput": 5650.64, "total_tokens": 18177672} {"current_steps": 27845, "total_steps": 33920, "loss": 0.2923, "lr": 9.459815642916759e-07, "epoch": 16.41804245283019, "percentage": 82.09, "elapsed_time": "0:53:37", "remaining_time": "0:11:41", "throughput": 5650.67, "total_tokens": 18180680} {"current_steps": 27850, "total_steps": 33920, "loss": 0.1989, "lr": 9.444762446572692e-07, "epoch": 16.420990566037737, "percentage": 82.1, "elapsed_time": "0:53:37", "remaining_time": "0:11:41", "throughput": 5650.6, "total_tokens": 18183176} {"current_steps": 27855, "total_steps": 33920, "loss": 0.2629, "lr": 9.429719987402541e-07, "epoch": 16.423938679245282, "percentage": 82.12, "elapsed_time": "0:53:38", "remaining_time": "0:11:40", "throughput": 5650.74, "total_tokens": 18186920} {"current_steps": 27860, "total_steps": 33920, "loss": 0.3354, "lr": 9.414688269388883e-07, "epoch": 16.42688679245283, "percentage": 82.13, "elapsed_time": "0:53:39", "remaining_time": "0:11:40", "throughput": 5650.84, "total_tokens": 18190248} {"current_steps": 27865, "total_steps": 33920, "loss": 0.264, "lr": 9.3996672965114e-07, "epoch": 16.42983490566038, "percentage": 82.15, "elapsed_time": "0:53:39", "remaining_time": "0:11:39", "throughput": 5650.84, "total_tokens": 18193320} {"current_steps": 27870, "total_steps": 33920, "loss": 0.2176, "lr": 9.384657072747e-07, "epoch": 16.432783018867923, "percentage": 82.16, "elapsed_time": "0:53:40", "remaining_time": "0:11:39", "throughput": 5650.96, "total_tokens": 18196776} {"current_steps": 27875, "total_steps": 33920, "loss": 0.3374, "lr": 9.369657602069676e-07, "epoch": 16.43573113207547, "percentage": 82.18, "elapsed_time": "0:53:40", "remaining_time": "0:11:38", "throughput": 5650.88, "total_tokens": 18199496} {"current_steps": 27880, "total_steps": 33920, "loss": 0.371, "lr": 9.354668888450608e-07, "epoch": 16.43867924528302, "percentage": 82.19, "elapsed_time": "0:53:41", "remaining_time": "0:11:37", "throughput": 5650.69, "total_tokens": 18201800} {"current_steps": 27885, "total_steps": 33920, "loss": 0.3468, "lr": 9.339690935858125e-07, "epoch": 16.441627358490567, "percentage": 82.21, "elapsed_time": "0:53:41", "remaining_time": "0:11:37", "throughput": 5650.7, "total_tokens": 18204648} {"current_steps": 27890, "total_steps": 33920, "loss": 0.3576, "lr": 9.324723748257697e-07, "epoch": 16.444575471698112, "percentage": 82.22, "elapsed_time": "0:53:42", "remaining_time": "0:11:36", "throughput": 5650.69, "total_tokens": 18207528} {"current_steps": 27895, "total_steps": 33920, "loss": 0.3242, "lr": 9.309767329611963e-07, "epoch": 16.44752358490566, "percentage": 82.24, "elapsed_time": "0:53:42", "remaining_time": "0:11:36", "throughput": 5650.73, "total_tokens": 18210568} {"current_steps": 27900, "total_steps": 33920, "loss": 0.2337, "lr": 9.294821683880695e-07, "epoch": 16.45047169811321, "percentage": 82.25, "elapsed_time": "0:53:43", "remaining_time": "0:11:35", "throughput": 5650.77, "total_tokens": 18213544} {"current_steps": 27905, "total_steps": 33920, "loss": 0.2543, "lr": 9.279886815020816e-07, "epoch": 16.453419811320753, "percentage": 82.27, "elapsed_time": "0:53:43", "remaining_time": "0:11:34", "throughput": 5650.91, "total_tokens": 18217352} {"current_steps": 27910, "total_steps": 33920, "loss": 0.3855, "lr": 9.264962726986393e-07, "epoch": 16.4563679245283, "percentage": 82.28, "elapsed_time": "0:53:44", "remaining_time": "0:11:34", "throughput": 5650.91, "total_tokens": 18220456} {"current_steps": 27915, "total_steps": 33920, "loss": 0.2477, "lr": 9.250049423728652e-07, "epoch": 16.45931603773585, "percentage": 82.3, "elapsed_time": "0:53:44", "remaining_time": "0:11:33", "throughput": 5650.98, "total_tokens": 18223880} {"current_steps": 27920, "total_steps": 33920, "loss": 0.3087, "lr": 9.235146909195936e-07, "epoch": 16.462264150943398, "percentage": 82.31, "elapsed_time": "0:53:45", "remaining_time": "0:11:33", "throughput": 5650.99, "total_tokens": 18226856} {"current_steps": 27925, "total_steps": 33920, "loss": 0.2958, "lr": 9.220255187333771e-07, "epoch": 16.465212264150942, "percentage": 82.33, "elapsed_time": "0:53:45", "remaining_time": "0:11:32", "throughput": 5651.06, "total_tokens": 18230248} {"current_steps": 27930, "total_steps": 33920, "loss": 0.3608, "lr": 9.205374262084798e-07, "epoch": 16.46816037735849, "percentage": 82.34, "elapsed_time": "0:53:46", "remaining_time": "0:11:31", "throughput": 5650.78, "total_tokens": 18232136} {"current_steps": 27935, "total_steps": 33920, "loss": 0.4124, "lr": 9.190504137388806e-07, "epoch": 16.47110849056604, "percentage": 82.36, "elapsed_time": "0:53:47", "remaining_time": "0:11:31", "throughput": 5650.96, "total_tokens": 18236552} {"current_steps": 27940, "total_steps": 33920, "loss": 0.3101, "lr": 9.175644817182722e-07, "epoch": 16.474056603773583, "percentage": 82.37, "elapsed_time": "0:53:47", "remaining_time": "0:11:30", "throughput": 5650.88, "total_tokens": 18239240} {"current_steps": 27945, "total_steps": 33920, "loss": 0.3018, "lr": 9.16079630540061e-07, "epoch": 16.47700471698113, "percentage": 82.39, "elapsed_time": "0:53:48", "remaining_time": "0:11:30", "throughput": 5650.81, "total_tokens": 18242088} {"current_steps": 27950, "total_steps": 33920, "loss": 0.3046, "lr": 9.145958605973676e-07, "epoch": 16.47995283018868, "percentage": 82.4, "elapsed_time": "0:53:48", "remaining_time": "0:11:29", "throughput": 5650.73, "total_tokens": 18244936} {"current_steps": 27955, "total_steps": 33920, "loss": 0.3508, "lr": 9.131131722830289e-07, "epoch": 16.482900943396228, "percentage": 82.41, "elapsed_time": "0:53:49", "remaining_time": "0:11:29", "throughput": 5650.82, "total_tokens": 18248520} {"current_steps": 27960, "total_steps": 33920, "loss": 0.387, "lr": 9.116315659895892e-07, "epoch": 16.485849056603772, "percentage": 82.43, "elapsed_time": "0:53:49", "remaining_time": "0:11:28", "throughput": 5650.82, "total_tokens": 18251752} {"current_steps": 27965, "total_steps": 33920, "loss": 0.2943, "lr": 9.10151042109314e-07, "epoch": 16.48879716981132, "percentage": 82.44, "elapsed_time": "0:53:50", "remaining_time": "0:11:27", "throughput": 5650.91, "total_tokens": 18255144} {"current_steps": 27970, "total_steps": 33920, "loss": 0.3224, "lr": 9.086716010341767e-07, "epoch": 16.49174528301887, "percentage": 82.46, "elapsed_time": "0:53:51", "remaining_time": "0:11:27", "throughput": 5650.97, "total_tokens": 18258376} {"current_steps": 27975, "total_steps": 33920, "loss": 0.23, "lr": 9.071932431558655e-07, "epoch": 16.494693396226417, "percentage": 82.47, "elapsed_time": "0:53:51", "remaining_time": "0:11:26", "throughput": 5650.96, "total_tokens": 18261128} {"current_steps": 27980, "total_steps": 33920, "loss": 0.2526, "lr": 9.057159688657824e-07, "epoch": 16.49764150943396, "percentage": 82.49, "elapsed_time": "0:53:52", "remaining_time": "0:11:26", "throughput": 5651.06, "total_tokens": 18264360} {"current_steps": 27985, "total_steps": 33920, "loss": 0.2936, "lr": 9.042397785550405e-07, "epoch": 16.50058962264151, "percentage": 82.5, "elapsed_time": "0:53:52", "remaining_time": "0:11:25", "throughput": 5651.14, "total_tokens": 18267528} {"current_steps": 27990, "total_steps": 33920, "loss": 0.299, "lr": 9.027646726144707e-07, "epoch": 16.503537735849058, "percentage": 82.52, "elapsed_time": "0:53:53", "remaining_time": "0:11:24", "throughput": 5651.19, "total_tokens": 18270952} {"current_steps": 27995, "total_steps": 33920, "loss": 0.2675, "lr": 9.012906514346115e-07, "epoch": 16.506485849056602, "percentage": 82.53, "elapsed_time": "0:53:53", "remaining_time": "0:11:24", "throughput": 5651.29, "total_tokens": 18274472} {"current_steps": 28000, "total_steps": 33920, "loss": 0.2104, "lr": 8.99817715405717e-07, "epoch": 16.50943396226415, "percentage": 82.55, "elapsed_time": "0:53:54", "remaining_time": "0:11:23", "throughput": 5651.51, "total_tokens": 18278568} {"current_steps": 28005, "total_steps": 33920, "loss": 0.226, "lr": 8.983458649177529e-07, "epoch": 16.5123820754717, "percentage": 82.56, "elapsed_time": "0:53:54", "remaining_time": "0:11:23", "throughput": 5651.4, "total_tokens": 18280936} {"current_steps": 28010, "total_steps": 33920, "loss": 0.3768, "lr": 8.968751003603982e-07, "epoch": 16.515330188679247, "percentage": 82.58, "elapsed_time": "0:53:55", "remaining_time": "0:11:22", "throughput": 5651.41, "total_tokens": 18283944} {"current_steps": 28015, "total_steps": 33920, "loss": 0.3887, "lr": 8.95405422123043e-07, "epoch": 16.51827830188679, "percentage": 82.59, "elapsed_time": "0:53:55", "remaining_time": "0:11:22", "throughput": 5651.42, "total_tokens": 18287144} {"current_steps": 28020, "total_steps": 33920, "loss": 0.4066, "lr": 8.939368305947932e-07, "epoch": 16.52122641509434, "percentage": 82.61, "elapsed_time": "0:53:56", "remaining_time": "0:11:21", "throughput": 5651.56, "total_tokens": 18291080} {"current_steps": 28025, "total_steps": 33920, "loss": 0.281, "lr": 8.92469326164464e-07, "epoch": 16.524174528301888, "percentage": 82.62, "elapsed_time": "0:53:56", "remaining_time": "0:11:20", "throughput": 5651.49, "total_tokens": 18293768} {"current_steps": 28030, "total_steps": 33920, "loss": 0.1902, "lr": 8.910029092205829e-07, "epoch": 16.527122641509433, "percentage": 82.64, "elapsed_time": "0:53:57", "remaining_time": "0:11:20", "throughput": 5651.33, "total_tokens": 18296040} {"current_steps": 28035, "total_steps": 33920, "loss": 0.1956, "lr": 8.895375801513906e-07, "epoch": 16.53007075471698, "percentage": 82.65, "elapsed_time": "0:53:58", "remaining_time": "0:11:19", "throughput": 5651.52, "total_tokens": 18300552} {"current_steps": 28040, "total_steps": 33920, "loss": 0.266, "lr": 8.880733393448377e-07, "epoch": 16.53301886792453, "percentage": 82.67, "elapsed_time": "0:53:58", "remaining_time": "0:11:19", "throughput": 5651.64, "total_tokens": 18304040} {"current_steps": 28045, "total_steps": 33920, "loss": 0.3377, "lr": 8.866101871885907e-07, "epoch": 16.535966981132077, "percentage": 82.68, "elapsed_time": "0:53:59", "remaining_time": "0:11:18", "throughput": 5651.66, "total_tokens": 18307016} {"current_steps": 28050, "total_steps": 33920, "loss": 0.3493, "lr": 8.851481240700249e-07, "epoch": 16.53891509433962, "percentage": 82.69, "elapsed_time": "0:53:59", "remaining_time": "0:11:17", "throughput": 5651.76, "total_tokens": 18310344} {"current_steps": 28055, "total_steps": 33920, "loss": 0.2163, "lr": 8.836871503762257e-07, "epoch": 16.54186320754717, "percentage": 82.71, "elapsed_time": "0:54:00", "remaining_time": "0:11:17", "throughput": 5651.89, "total_tokens": 18313704} {"current_steps": 28060, "total_steps": 33920, "loss": 0.297, "lr": 8.822272664939946e-07, "epoch": 16.544811320754718, "percentage": 82.72, "elapsed_time": "0:54:00", "remaining_time": "0:11:16", "throughput": 5651.96, "total_tokens": 18317032} {"current_steps": 28065, "total_steps": 33920, "loss": 0.3069, "lr": 8.80768472809842e-07, "epoch": 16.547759433962263, "percentage": 82.74, "elapsed_time": "0:54:01", "remaining_time": "0:11:16", "throughput": 5651.97, "total_tokens": 18320008} {"current_steps": 28070, "total_steps": 33920, "loss": 0.5205, "lr": 8.793107697099884e-07, "epoch": 16.55070754716981, "percentage": 82.75, "elapsed_time": "0:54:01", "remaining_time": "0:11:15", "throughput": 5651.97, "total_tokens": 18322888} {"current_steps": 28075, "total_steps": 33920, "loss": 0.3003, "lr": 8.778541575803673e-07, "epoch": 16.55365566037736, "percentage": 82.77, "elapsed_time": "0:54:02", "remaining_time": "0:11:15", "throughput": 5651.95, "total_tokens": 18325608} {"current_steps": 28080, "total_steps": 33920, "loss": 0.2158, "lr": 8.763986368066241e-07, "epoch": 16.556603773584907, "percentage": 82.78, "elapsed_time": "0:54:02", "remaining_time": "0:11:14", "throughput": 5651.97, "total_tokens": 18328616} {"current_steps": 28085, "total_steps": 33920, "loss": 0.2683, "lr": 8.749442077741138e-07, "epoch": 16.559551886792452, "percentage": 82.8, "elapsed_time": "0:54:03", "remaining_time": "0:11:13", "throughput": 5651.98, "total_tokens": 18331496} {"current_steps": 28090, "total_steps": 33920, "loss": 0.4226, "lr": 8.734908708679024e-07, "epoch": 16.5625, "percentage": 82.81, "elapsed_time": "0:54:03", "remaining_time": "0:11:13", "throughput": 5652.0, "total_tokens": 18334440} {"current_steps": 28095, "total_steps": 33920, "loss": 0.3538, "lr": 8.72038626472767e-07, "epoch": 16.565448113207548, "percentage": 82.83, "elapsed_time": "0:54:04", "remaining_time": "0:11:12", "throughput": 5652.02, "total_tokens": 18337384} {"current_steps": 28100, "total_steps": 33920, "loss": 0.3107, "lr": 8.705874749731962e-07, "epoch": 16.568396226415093, "percentage": 82.84, "elapsed_time": "0:54:04", "remaining_time": "0:11:12", "throughput": 5652.09, "total_tokens": 18340520} {"current_steps": 28105, "total_steps": 33920, "loss": 0.3541, "lr": 8.691374167533867e-07, "epoch": 16.57134433962264, "percentage": 82.86, "elapsed_time": "0:54:05", "remaining_time": "0:11:11", "throughput": 5652.16, "total_tokens": 18343656} {"current_steps": 28110, "total_steps": 33920, "loss": 0.2594, "lr": 8.6768845219725e-07, "epoch": 16.57429245283019, "percentage": 82.87, "elapsed_time": "0:54:05", "remaining_time": "0:11:10", "throughput": 5652.25, "total_tokens": 18347176} {"current_steps": 28115, "total_steps": 33920, "loss": 0.3494, "lr": 8.662405816884056e-07, "epoch": 16.577240566037737, "percentage": 82.89, "elapsed_time": "0:54:06", "remaining_time": "0:11:10", "throughput": 5652.37, "total_tokens": 18350792} {"current_steps": 28120, "total_steps": 33920, "loss": 0.1981, "lr": 8.647938056101824e-07, "epoch": 16.580188679245282, "percentage": 82.9, "elapsed_time": "0:54:07", "remaining_time": "0:11:09", "throughput": 5652.51, "total_tokens": 18354408} {"current_steps": 28125, "total_steps": 33920, "loss": 0.3991, "lr": 8.63348124345621e-07, "epoch": 16.58313679245283, "percentage": 82.92, "elapsed_time": "0:54:07", "remaining_time": "0:11:09", "throughput": 5652.52, "total_tokens": 18357352} {"current_steps": 28130, "total_steps": 33920, "loss": 0.2869, "lr": 8.619035382774716e-07, "epoch": 16.58608490566038, "percentage": 82.93, "elapsed_time": "0:54:08", "remaining_time": "0:11:08", "throughput": 5652.52, "total_tokens": 18360136} {"current_steps": 28135, "total_steps": 33920, "loss": 0.2447, "lr": 8.60460047788193e-07, "epoch": 16.589033018867923, "percentage": 82.95, "elapsed_time": "0:54:08", "remaining_time": "0:11:07", "throughput": 5652.52, "total_tokens": 18363080} {"current_steps": 28140, "total_steps": 33920, "loss": 0.2602, "lr": 8.590176532599587e-07, "epoch": 16.59198113207547, "percentage": 82.96, "elapsed_time": "0:54:09", "remaining_time": "0:11:07", "throughput": 5652.72, "total_tokens": 18367528} {"current_steps": 28145, "total_steps": 33920, "loss": 0.276, "lr": 8.575763550746475e-07, "epoch": 16.59492924528302, "percentage": 82.97, "elapsed_time": "0:54:09", "remaining_time": "0:11:06", "throughput": 5652.79, "total_tokens": 18370856} {"current_steps": 28150, "total_steps": 33920, "loss": 0.4144, "lr": 8.56136153613848e-07, "epoch": 16.597877358490567, "percentage": 82.99, "elapsed_time": "0:54:10", "remaining_time": "0:11:06", "throughput": 5652.86, "total_tokens": 18373864} {"current_steps": 28155, "total_steps": 33920, "loss": 0.2785, "lr": 8.546970492588619e-07, "epoch": 16.600825471698112, "percentage": 83.0, "elapsed_time": "0:54:10", "remaining_time": "0:11:05", "throughput": 5653.01, "total_tokens": 18377544} {"current_steps": 28160, "total_steps": 33920, "loss": 0.3432, "lr": 8.532590423906973e-07, "epoch": 16.60377358490566, "percentage": 83.02, "elapsed_time": "0:54:11", "remaining_time": "0:11:05", "throughput": 5653.06, "total_tokens": 18380680} {"current_steps": 28165, "total_steps": 33920, "loss": 0.2575, "lr": 8.518221333900728e-07, "epoch": 16.60672169811321, "percentage": 83.03, "elapsed_time": "0:54:11", "remaining_time": "0:11:04", "throughput": 5653.09, "total_tokens": 18383560} {"current_steps": 28170, "total_steps": 33920, "loss": 0.3153, "lr": 8.503863226374148e-07, "epoch": 16.609669811320753, "percentage": 83.05, "elapsed_time": "0:54:12", "remaining_time": "0:11:03", "throughput": 5653.11, "total_tokens": 18386312} {"current_steps": 28175, "total_steps": 33920, "loss": 0.263, "lr": 8.489516105128632e-07, "epoch": 16.6126179245283, "percentage": 83.06, "elapsed_time": "0:54:12", "remaining_time": "0:11:03", "throughput": 5653.24, "total_tokens": 18389768} {"current_steps": 28180, "total_steps": 33920, "loss": 0.3698, "lr": 8.475179973962621e-07, "epoch": 16.61556603773585, "percentage": 83.08, "elapsed_time": "0:54:13", "remaining_time": "0:11:02", "throughput": 5653.29, "total_tokens": 18393096} {"current_steps": 28185, "total_steps": 33920, "loss": 0.2733, "lr": 8.460854836671678e-07, "epoch": 16.618514150943398, "percentage": 83.09, "elapsed_time": "0:54:14", "remaining_time": "0:11:02", "throughput": 5653.27, "total_tokens": 18396136} {"current_steps": 28190, "total_steps": 33920, "loss": 0.2841, "lr": 8.446540697048445e-07, "epoch": 16.621462264150942, "percentage": 83.11, "elapsed_time": "0:54:14", "remaining_time": "0:11:01", "throughput": 5653.31, "total_tokens": 18399016} {"current_steps": 28195, "total_steps": 33920, "loss": 0.3294, "lr": 8.432237558882639e-07, "epoch": 16.62441037735849, "percentage": 83.12, "elapsed_time": "0:54:15", "remaining_time": "0:11:00", "throughput": 5653.45, "total_tokens": 18402792} {"current_steps": 28200, "total_steps": 33920, "loss": 0.2806, "lr": 8.417945425961083e-07, "epoch": 16.62735849056604, "percentage": 83.14, "elapsed_time": "0:54:15", "remaining_time": "0:11:00", "throughput": 5653.5, "total_tokens": 18405736} {"current_steps": 28205, "total_steps": 33920, "loss": 0.383, "lr": 8.403664302067688e-07, "epoch": 16.630306603773583, "percentage": 83.15, "elapsed_time": "0:54:16", "remaining_time": "0:10:59", "throughput": 5653.59, "total_tokens": 18408968} {"current_steps": 28210, "total_steps": 33920, "loss": 0.2602, "lr": 8.389394190983446e-07, "epoch": 16.63325471698113, "percentage": 83.17, "elapsed_time": "0:54:16", "remaining_time": "0:10:59", "throughput": 5653.63, "total_tokens": 18412200} {"current_steps": 28215, "total_steps": 33920, "loss": 0.2409, "lr": 8.37513509648642e-07, "epoch": 16.63620283018868, "percentage": 83.18, "elapsed_time": "0:54:17", "remaining_time": "0:10:58", "throughput": 5653.67, "total_tokens": 18415336} {"current_steps": 28220, "total_steps": 33920, "loss": 0.4233, "lr": 8.360887022351771e-07, "epoch": 16.639150943396228, "percentage": 83.2, "elapsed_time": "0:54:17", "remaining_time": "0:10:58", "throughput": 5653.74, "total_tokens": 18418728} {"current_steps": 28225, "total_steps": 33920, "loss": 0.3023, "lr": 8.346649972351739e-07, "epoch": 16.642099056603772, "percentage": 83.21, "elapsed_time": "0:54:18", "remaining_time": "0:10:57", "throughput": 5654.0, "total_tokens": 18425896} {"current_steps": 28230, "total_steps": 33920, "loss": 0.3672, "lr": 8.33242395025563e-07, "epoch": 16.64504716981132, "percentage": 83.23, "elapsed_time": "0:54:19", "remaining_time": "0:10:56", "throughput": 5653.95, "total_tokens": 18428552} {"current_steps": 28235, "total_steps": 33920, "loss": 0.3192, "lr": 8.318208959829871e-07, "epoch": 16.64799528301887, "percentage": 83.24, "elapsed_time": "0:54:19", "remaining_time": "0:10:56", "throughput": 5653.79, "total_tokens": 18431176} {"current_steps": 28240, "total_steps": 33920, "loss": 0.3292, "lr": 8.304005004837929e-07, "epoch": 16.650943396226417, "percentage": 83.25, "elapsed_time": "0:54:20", "remaining_time": "0:10:55", "throughput": 5653.9, "total_tokens": 18434760} {"current_steps": 28245, "total_steps": 33920, "loss": 0.3402, "lr": 8.289812089040344e-07, "epoch": 16.65389150943396, "percentage": 83.27, "elapsed_time": "0:54:21", "remaining_time": "0:10:55", "throughput": 5653.94, "total_tokens": 18437896} {"current_steps": 28250, "total_steps": 33920, "loss": 0.291, "lr": 8.275630216194785e-07, "epoch": 16.65683962264151, "percentage": 83.28, "elapsed_time": "0:54:21", "remaining_time": "0:10:54", "throughput": 5654.01, "total_tokens": 18441064} {"current_steps": 28255, "total_steps": 33920, "loss": 0.3331, "lr": 8.261459390055948e-07, "epoch": 16.659787735849058, "percentage": 83.3, "elapsed_time": "0:54:22", "remaining_time": "0:10:54", "throughput": 5653.91, "total_tokens": 18443560} {"current_steps": 28260, "total_steps": 33920, "loss": 0.3333, "lr": 8.24729961437562e-07, "epoch": 16.662735849056602, "percentage": 83.31, "elapsed_time": "0:54:22", "remaining_time": "0:10:53", "throughput": 5653.87, "total_tokens": 18446632} {"current_steps": 28265, "total_steps": 33920, "loss": 0.3638, "lr": 8.233150892902653e-07, "epoch": 16.66568396226415, "percentage": 83.33, "elapsed_time": "0:54:23", "remaining_time": "0:10:52", "throughput": 5653.97, "total_tokens": 18450088} {"current_steps": 28270, "total_steps": 33920, "loss": 0.2796, "lr": 8.219013229383005e-07, "epoch": 16.6686320754717, "percentage": 83.34, "elapsed_time": "0:54:23", "remaining_time": "0:10:52", "throughput": 5654.13, "total_tokens": 18454152} {"current_steps": 28275, "total_steps": 33920, "loss": 0.3369, "lr": 8.204886627559666e-07, "epoch": 16.671580188679247, "percentage": 83.36, "elapsed_time": "0:54:24", "remaining_time": "0:10:51", "throughput": 5654.02, "total_tokens": 18456840} {"current_steps": 28280, "total_steps": 33920, "loss": 0.2469, "lr": 8.190771091172722e-07, "epoch": 16.67452830188679, "percentage": 83.37, "elapsed_time": "0:54:24", "remaining_time": "0:10:51", "throughput": 5654.05, "total_tokens": 18460168} {"current_steps": 28285, "total_steps": 33920, "loss": 0.5131, "lr": 8.176666623959323e-07, "epoch": 16.67747641509434, "percentage": 83.39, "elapsed_time": "0:54:25", "remaining_time": "0:10:50", "throughput": 5654.02, "total_tokens": 18463464} {"current_steps": 28290, "total_steps": 33920, "loss": 0.2696, "lr": 8.162573229653681e-07, "epoch": 16.680424528301888, "percentage": 83.4, "elapsed_time": "0:54:26", "remaining_time": "0:10:50", "throughput": 5653.98, "total_tokens": 18466952} {"current_steps": 28295, "total_steps": 33920, "loss": 0.2215, "lr": 8.148490911987073e-07, "epoch": 16.683372641509433, "percentage": 83.42, "elapsed_time": "0:54:26", "remaining_time": "0:10:49", "throughput": 5653.85, "total_tokens": 18469448} {"current_steps": 28300, "total_steps": 33920, "loss": 0.4376, "lr": 8.134419674687876e-07, "epoch": 16.68632075471698, "percentage": 83.43, "elapsed_time": "0:54:27", "remaining_time": "0:10:48", "throughput": 5653.96, "total_tokens": 18473000} {"current_steps": 28305, "total_steps": 33920, "loss": 0.3218, "lr": 8.120359521481502e-07, "epoch": 16.68926886792453, "percentage": 83.45, "elapsed_time": "0:54:27", "remaining_time": "0:10:48", "throughput": 5653.96, "total_tokens": 18475848} {"current_steps": 28310, "total_steps": 33920, "loss": 0.2893, "lr": 8.106310456090438e-07, "epoch": 16.692216981132077, "percentage": 83.46, "elapsed_time": "0:54:28", "remaining_time": "0:10:47", "throughput": 5654.11, "total_tokens": 18479848} {"current_steps": 28315, "total_steps": 33920, "loss": 0.3681, "lr": 8.092272482234231e-07, "epoch": 16.69516509433962, "percentage": 83.48, "elapsed_time": "0:54:29", "remaining_time": "0:10:47", "throughput": 5654.32, "total_tokens": 18484264} {"current_steps": 28320, "total_steps": 33920, "loss": 0.2736, "lr": 8.078245603629486e-07, "epoch": 16.69811320754717, "percentage": 83.49, "elapsed_time": "0:54:29", "remaining_time": "0:10:46", "throughput": 5654.31, "total_tokens": 18487080} {"current_steps": 28325, "total_steps": 33920, "loss": 0.2139, "lr": 8.0642298239899e-07, "epoch": 16.701061320754718, "percentage": 83.51, "elapsed_time": "0:54:30", "remaining_time": "0:10:45", "throughput": 5654.33, "total_tokens": 18490248} {"current_steps": 28330, "total_steps": 33920, "loss": 0.3513, "lr": 8.050225147026202e-07, "epoch": 16.704009433962263, "percentage": 83.52, "elapsed_time": "0:54:30", "remaining_time": "0:10:45", "throughput": 5654.54, "total_tokens": 18494504} {"current_steps": 28335, "total_steps": 33920, "loss": 0.4131, "lr": 8.03623157644619e-07, "epoch": 16.70695754716981, "percentage": 83.53, "elapsed_time": "0:54:31", "remaining_time": "0:10:44", "throughput": 5654.69, "total_tokens": 18498120} {"current_steps": 28340, "total_steps": 33920, "loss": 0.2537, "lr": 8.022249115954728e-07, "epoch": 16.70990566037736, "percentage": 83.55, "elapsed_time": "0:54:31", "remaining_time": "0:10:44", "throughput": 5654.79, "total_tokens": 18501768} {"current_steps": 28345, "total_steps": 33920, "loss": 0.2565, "lr": 8.008277769253709e-07, "epoch": 16.712853773584907, "percentage": 83.56, "elapsed_time": "0:54:32", "remaining_time": "0:10:43", "throughput": 5654.62, "total_tokens": 18504136} {"current_steps": 28350, "total_steps": 33920, "loss": 0.3364, "lr": 7.994317540042135e-07, "epoch": 16.715801886792452, "percentage": 83.58, "elapsed_time": "0:54:32", "remaining_time": "0:10:43", "throughput": 5654.62, "total_tokens": 18507208} {"current_steps": 28355, "total_steps": 33920, "loss": 0.1977, "lr": 7.980368432016017e-07, "epoch": 16.71875, "percentage": 83.59, "elapsed_time": "0:54:33", "remaining_time": "0:10:42", "throughput": 5654.71, "total_tokens": 18510472} {"current_steps": 28360, "total_steps": 33920, "loss": 0.313, "lr": 7.966430448868461e-07, "epoch": 16.721698113207548, "percentage": 83.61, "elapsed_time": "0:54:33", "remaining_time": "0:10:41", "throughput": 5654.65, "total_tokens": 18513064} {"current_steps": 28365, "total_steps": 33920, "loss": 0.3984, "lr": 7.952503594289601e-07, "epoch": 16.724646226415093, "percentage": 83.62, "elapsed_time": "0:54:34", "remaining_time": "0:10:41", "throughput": 5654.53, "total_tokens": 18515624} {"current_steps": 28370, "total_steps": 33920, "loss": 0.3171, "lr": 7.93858787196663e-07, "epoch": 16.72759433962264, "percentage": 83.64, "elapsed_time": "0:54:35", "remaining_time": "0:10:40", "throughput": 5654.58, "total_tokens": 18518888} {"current_steps": 28375, "total_steps": 33920, "loss": 0.3995, "lr": 7.92468328558379e-07, "epoch": 16.73054245283019, "percentage": 83.65, "elapsed_time": "0:54:35", "remaining_time": "0:10:40", "throughput": 5654.52, "total_tokens": 18521416} {"current_steps": 28380, "total_steps": 33920, "loss": 0.392, "lr": 7.910789838822386e-07, "epoch": 16.733490566037737, "percentage": 83.67, "elapsed_time": "0:54:36", "remaining_time": "0:10:39", "throughput": 5654.59, "total_tokens": 18524712} {"current_steps": 28385, "total_steps": 33920, "loss": 0.4172, "lr": 7.89690753536076e-07, "epoch": 16.736438679245282, "percentage": 83.68, "elapsed_time": "0:54:36", "remaining_time": "0:10:38", "throughput": 5654.6, "total_tokens": 18527560} {"current_steps": 28390, "total_steps": 33920, "loss": 0.3907, "lr": 7.883036378874326e-07, "epoch": 16.73938679245283, "percentage": 83.7, "elapsed_time": "0:54:37", "remaining_time": "0:10:38", "throughput": 5654.67, "total_tokens": 18530696} {"current_steps": 28395, "total_steps": 33920, "loss": 0.2807, "lr": 7.86917637303552e-07, "epoch": 16.74233490566038, "percentage": 83.71, "elapsed_time": "0:54:37", "remaining_time": "0:10:37", "throughput": 5654.83, "total_tokens": 18534280} {"current_steps": 28400, "total_steps": 33920, "loss": 0.3088, "lr": 7.855327521513851e-07, "epoch": 16.745283018867923, "percentage": 83.73, "elapsed_time": "0:54:38", "remaining_time": "0:10:37", "throughput": 5654.75, "total_tokens": 18536648} {"current_steps": 28405, "total_steps": 33920, "loss": 0.2986, "lr": 7.841489827975851e-07, "epoch": 16.74823113207547, "percentage": 83.74, "elapsed_time": "0:54:38", "remaining_time": "0:10:36", "throughput": 5654.7, "total_tokens": 18539496} {"current_steps": 28410, "total_steps": 33920, "loss": 0.3336, "lr": 7.827663296085109e-07, "epoch": 16.75117924528302, "percentage": 83.76, "elapsed_time": "0:54:39", "remaining_time": "0:10:35", "throughput": 5654.57, "total_tokens": 18541896} {"current_steps": 28415, "total_steps": 33920, "loss": 0.336, "lr": 7.813847929502255e-07, "epoch": 16.754127358490567, "percentage": 83.77, "elapsed_time": "0:54:39", "remaining_time": "0:10:35", "throughput": 5654.54, "total_tokens": 18544840} {"current_steps": 28420, "total_steps": 33920, "loss": 0.2786, "lr": 7.800043731884982e-07, "epoch": 16.757075471698112, "percentage": 83.79, "elapsed_time": "0:54:40", "remaining_time": "0:10:34", "throughput": 5654.63, "total_tokens": 18548808} {"current_steps": 28425, "total_steps": 33920, "loss": 0.3584, "lr": 7.786250706888005e-07, "epoch": 16.76002358490566, "percentage": 83.8, "elapsed_time": "0:54:40", "remaining_time": "0:10:34", "throughput": 5654.63, "total_tokens": 18552040} {"current_steps": 28430, "total_steps": 33920, "loss": 0.2194, "lr": 7.772468858163085e-07, "epoch": 16.76297169811321, "percentage": 83.81, "elapsed_time": "0:54:41", "remaining_time": "0:10:33", "throughput": 5654.69, "total_tokens": 18555176} {"current_steps": 28435, "total_steps": 33920, "loss": 0.2222, "lr": 7.758698189359026e-07, "epoch": 16.765919811320753, "percentage": 83.83, "elapsed_time": "0:54:42", "remaining_time": "0:10:33", "throughput": 5654.86, "total_tokens": 18561032} {"current_steps": 28440, "total_steps": 33920, "loss": 0.2306, "lr": 7.744938704121658e-07, "epoch": 16.7688679245283, "percentage": 83.84, "elapsed_time": "0:54:42", "remaining_time": "0:10:32", "throughput": 5654.86, "total_tokens": 18563848} {"current_steps": 28445, "total_steps": 33920, "loss": 0.2519, "lr": 7.731190406093892e-07, "epoch": 16.77181603773585, "percentage": 83.86, "elapsed_time": "0:54:43", "remaining_time": "0:10:31", "throughput": 5654.92, "total_tokens": 18567144} {"current_steps": 28450, "total_steps": 33920, "loss": 0.526, "lr": 7.717453298915617e-07, "epoch": 16.774764150943398, "percentage": 83.87, "elapsed_time": "0:54:43", "remaining_time": "0:10:31", "throughput": 5654.88, "total_tokens": 18569768} {"current_steps": 28455, "total_steps": 33920, "loss": 0.2791, "lr": 7.703727386223825e-07, "epoch": 16.777712264150942, "percentage": 83.89, "elapsed_time": "0:54:44", "remaining_time": "0:10:30", "throughput": 5654.82, "total_tokens": 18572328} {"current_steps": 28460, "total_steps": 33920, "loss": 0.3235, "lr": 7.690012671652491e-07, "epoch": 16.78066037735849, "percentage": 83.9, "elapsed_time": "0:54:44", "remaining_time": "0:10:30", "throughput": 5654.8, "total_tokens": 18575272} {"current_steps": 28465, "total_steps": 33920, "loss": 0.3406, "lr": 7.676309158832651e-07, "epoch": 16.78360849056604, "percentage": 83.92, "elapsed_time": "0:54:45", "remaining_time": "0:10:29", "throughput": 5654.78, "total_tokens": 18578152} {"current_steps": 28470, "total_steps": 33920, "loss": 0.3584, "lr": 7.662616851392362e-07, "epoch": 16.786556603773583, "percentage": 83.93, "elapsed_time": "0:54:45", "remaining_time": "0:10:29", "throughput": 5654.84, "total_tokens": 18581608} {"current_steps": 28475, "total_steps": 33920, "loss": 0.5609, "lr": 7.648935752956732e-07, "epoch": 16.78950471698113, "percentage": 83.95, "elapsed_time": "0:54:46", "remaining_time": "0:10:28", "throughput": 5654.98, "total_tokens": 18585512} {"current_steps": 28480, "total_steps": 33920, "loss": 0.3372, "lr": 7.635265867147867e-07, "epoch": 16.79245283018868, "percentage": 83.96, "elapsed_time": "0:54:47", "remaining_time": "0:10:27", "throughput": 5654.87, "total_tokens": 18587912} {"current_steps": 28485, "total_steps": 33920, "loss": 0.3827, "lr": 7.621607197584963e-07, "epoch": 16.795400943396228, "percentage": 83.98, "elapsed_time": "0:54:47", "remaining_time": "0:10:27", "throughput": 5655.02, "total_tokens": 18591464} {"current_steps": 28490, "total_steps": 33920, "loss": 0.454, "lr": 7.607959747884186e-07, "epoch": 16.798349056603772, "percentage": 83.99, "elapsed_time": "0:54:48", "remaining_time": "0:10:26", "throughput": 5655.03, "total_tokens": 18594312} {"current_steps": 28495, "total_steps": 33920, "loss": 0.3148, "lr": 7.594323521658769e-07, "epoch": 16.80129716981132, "percentage": 84.01, "elapsed_time": "0:54:48", "remaining_time": "0:10:26", "throughput": 5655.03, "total_tokens": 18597256} {"current_steps": 28500, "total_steps": 33920, "loss": 0.3437, "lr": 7.580698522518958e-07, "epoch": 16.80424528301887, "percentage": 84.02, "elapsed_time": "0:54:49", "remaining_time": "0:10:25", "throughput": 5655.01, "total_tokens": 18600168} {"current_steps": 28505, "total_steps": 33920, "loss": 0.2778, "lr": 7.567084754072035e-07, "epoch": 16.807193396226417, "percentage": 84.04, "elapsed_time": "0:54:49", "remaining_time": "0:10:24", "throughput": 5655.06, "total_tokens": 18603304} {"current_steps": 28510, "total_steps": 33920, "loss": 0.2765, "lr": 7.553482219922282e-07, "epoch": 16.81014150943396, "percentage": 84.05, "elapsed_time": "0:54:50", "remaining_time": "0:10:24", "throughput": 5655.1, "total_tokens": 18606312} {"current_steps": 28515, "total_steps": 33920, "loss": 0.2633, "lr": 7.539890923671061e-07, "epoch": 16.81308962264151, "percentage": 84.07, "elapsed_time": "0:54:50", "remaining_time": "0:10:23", "throughput": 5655.1, "total_tokens": 18609576} {"current_steps": 28520, "total_steps": 33920, "loss": 0.2989, "lr": 7.526310868916708e-07, "epoch": 16.816037735849058, "percentage": 84.08, "elapsed_time": "0:54:51", "remaining_time": "0:10:23", "throughput": 5655.15, "total_tokens": 18612904} {"current_steps": 28525, "total_steps": 33920, "loss": 0.2481, "lr": 7.512742059254602e-07, "epoch": 16.818985849056602, "percentage": 84.09, "elapsed_time": "0:54:51", "remaining_time": "0:10:22", "throughput": 5655.31, "total_tokens": 18616616} {"current_steps": 28530, "total_steps": 33920, "loss": 0.2846, "lr": 7.499184498277151e-07, "epoch": 16.82193396226415, "percentage": 84.11, "elapsed_time": "0:54:52", "remaining_time": "0:10:22", "throughput": 5655.38, "total_tokens": 18620008} {"current_steps": 28535, "total_steps": 33920, "loss": 0.2309, "lr": 7.485638189573758e-07, "epoch": 16.8248820754717, "percentage": 84.12, "elapsed_time": "0:54:52", "remaining_time": "0:10:21", "throughput": 5655.39, "total_tokens": 18622984} {"current_steps": 28540, "total_steps": 33920, "loss": 0.3069, "lr": 7.472103136730891e-07, "epoch": 16.827830188679247, "percentage": 84.14, "elapsed_time": "0:54:53", "remaining_time": "0:10:20", "throughput": 5655.43, "total_tokens": 18626024} {"current_steps": 28545, "total_steps": 33920, "loss": 0.4178, "lr": 7.458579343331996e-07, "epoch": 16.83077830188679, "percentage": 84.15, "elapsed_time": "0:54:54", "remaining_time": "0:10:20", "throughput": 5655.59, "total_tokens": 18629576} {"current_steps": 28550, "total_steps": 33920, "loss": 0.26, "lr": 7.445066812957569e-07, "epoch": 16.83372641509434, "percentage": 84.17, "elapsed_time": "0:54:54", "remaining_time": "0:10:19", "throughput": 5655.62, "total_tokens": 18632744} {"current_steps": 28555, "total_steps": 33920, "loss": 0.3094, "lr": 7.43156554918511e-07, "epoch": 16.836674528301888, "percentage": 84.18, "elapsed_time": "0:54:55", "remaining_time": "0:10:19", "throughput": 5655.68, "total_tokens": 18635784} {"current_steps": 28560, "total_steps": 33920, "loss": 0.3556, "lr": 7.418075555589132e-07, "epoch": 16.839622641509433, "percentage": 84.2, "elapsed_time": "0:54:55", "remaining_time": "0:10:18", "throughput": 5655.84, "total_tokens": 18639464} {"current_steps": 28565, "total_steps": 33920, "loss": 0.4945, "lr": 7.404596835741168e-07, "epoch": 16.84257075471698, "percentage": 84.21, "elapsed_time": "0:54:56", "remaining_time": "0:10:17", "throughput": 5655.95, "total_tokens": 18642760} {"current_steps": 28570, "total_steps": 33920, "loss": 0.3026, "lr": 7.391129393209751e-07, "epoch": 16.84551886792453, "percentage": 84.23, "elapsed_time": "0:54:56", "remaining_time": "0:10:17", "throughput": 5656.07, "total_tokens": 18646536} {"current_steps": 28575, "total_steps": 33920, "loss": 0.2912, "lr": 7.377673231560478e-07, "epoch": 16.848466981132077, "percentage": 84.24, "elapsed_time": "0:54:57", "remaining_time": "0:10:16", "throughput": 5656.15, "total_tokens": 18649704} {"current_steps": 28580, "total_steps": 33920, "loss": 0.3859, "lr": 7.364228354355907e-07, "epoch": 16.85141509433962, "percentage": 84.26, "elapsed_time": "0:54:57", "remaining_time": "0:10:16", "throughput": 5656.13, "total_tokens": 18652424} {"current_steps": 28585, "total_steps": 33920, "loss": 0.3358, "lr": 7.350794765155627e-07, "epoch": 16.85436320754717, "percentage": 84.27, "elapsed_time": "0:54:58", "remaining_time": "0:10:15", "throughput": 5656.12, "total_tokens": 18655368} {"current_steps": 28590, "total_steps": 33920, "loss": 0.3491, "lr": 7.337372467516246e-07, "epoch": 16.857311320754718, "percentage": 84.29, "elapsed_time": "0:54:58", "remaining_time": "0:10:14", "throughput": 5656.13, "total_tokens": 18658344} {"current_steps": 28595, "total_steps": 33920, "loss": 0.3281, "lr": 7.323961464991369e-07, "epoch": 16.860259433962263, "percentage": 84.3, "elapsed_time": "0:54:59", "remaining_time": "0:10:14", "throughput": 5656.19, "total_tokens": 18661448} {"current_steps": 28600, "total_steps": 33920, "loss": 0.2802, "lr": 7.310561761131601e-07, "epoch": 16.86320754716981, "percentage": 84.32, "elapsed_time": "0:54:59", "remaining_time": "0:10:13", "throughput": 5656.27, "total_tokens": 18664648} {"current_steps": 28605, "total_steps": 33920, "loss": 0.3634, "lr": 7.297173359484605e-07, "epoch": 16.86615566037736, "percentage": 84.33, "elapsed_time": "0:55:00", "remaining_time": "0:10:13", "throughput": 5656.17, "total_tokens": 18667400} {"current_steps": 28610, "total_steps": 33920, "loss": 0.2503, "lr": 7.283796263595e-07, "epoch": 16.869103773584907, "percentage": 84.35, "elapsed_time": "0:55:00", "remaining_time": "0:10:12", "throughput": 5656.22, "total_tokens": 18670440} {"current_steps": 28615, "total_steps": 33920, "loss": 0.522, "lr": 7.270430477004431e-07, "epoch": 16.872051886792452, "percentage": 84.36, "elapsed_time": "0:55:01", "remaining_time": "0:10:12", "throughput": 5656.2, "total_tokens": 18673032} {"current_steps": 28620, "total_steps": 33920, "loss": 0.447, "lr": 7.257076003251545e-07, "epoch": 16.875, "percentage": 84.38, "elapsed_time": "0:55:01", "remaining_time": "0:10:11", "throughput": 5656.4, "total_tokens": 18677192} {"current_steps": 28625, "total_steps": 33920, "loss": 0.2254, "lr": 7.243732845871998e-07, "epoch": 16.877948113207548, "percentage": 84.39, "elapsed_time": "0:55:02", "remaining_time": "0:10:10", "throughput": 5656.69, "total_tokens": 18682280} {"current_steps": 28630, "total_steps": 33920, "loss": 0.3509, "lr": 7.230401008398441e-07, "epoch": 16.880896226415093, "percentage": 84.4, "elapsed_time": "0:55:03", "remaining_time": "0:10:10", "throughput": 5656.81, "total_tokens": 18685736} {"current_steps": 28635, "total_steps": 33920, "loss": 0.334, "lr": 7.217080494360546e-07, "epoch": 16.88384433962264, "percentage": 84.42, "elapsed_time": "0:55:03", "remaining_time": "0:10:09", "throughput": 5656.9, "total_tokens": 18689032} {"current_steps": 28640, "total_steps": 33920, "loss": 0.3288, "lr": 7.20377130728498e-07, "epoch": 16.88679245283019, "percentage": 84.43, "elapsed_time": "0:55:04", "remaining_time": "0:10:09", "throughput": 5657.04, "total_tokens": 18692552} {"current_steps": 28645, "total_steps": 33920, "loss": 0.28, "lr": 7.190473450695407e-07, "epoch": 16.889740566037737, "percentage": 84.45, "elapsed_time": "0:55:04", "remaining_time": "0:10:08", "throughput": 5657.16, "total_tokens": 18695912} {"current_steps": 28650, "total_steps": 33920, "loss": 0.289, "lr": 7.177186928112484e-07, "epoch": 16.892688679245282, "percentage": 84.46, "elapsed_time": "0:55:05", "remaining_time": "0:10:07", "throughput": 5657.17, "total_tokens": 18698728} {"current_steps": 28655, "total_steps": 33920, "loss": 0.3824, "lr": 7.163911743053876e-07, "epoch": 16.89563679245283, "percentage": 84.48, "elapsed_time": "0:55:05", "remaining_time": "0:10:07", "throughput": 5657.25, "total_tokens": 18701864} {"current_steps": 28660, "total_steps": 33920, "loss": 0.2998, "lr": 7.150647899034252e-07, "epoch": 16.89858490566038, "percentage": 84.49, "elapsed_time": "0:55:06", "remaining_time": "0:10:06", "throughput": 5657.1, "total_tokens": 18704424} {"current_steps": 28665, "total_steps": 33920, "loss": 0.3218, "lr": 7.13739539956525e-07, "epoch": 16.901533018867923, "percentage": 84.51, "elapsed_time": "0:55:06", "remaining_time": "0:10:06", "throughput": 5657.18, "total_tokens": 18707720} {"current_steps": 28670, "total_steps": 33920, "loss": 0.3398, "lr": 7.124154248155562e-07, "epoch": 16.90448113207547, "percentage": 84.52, "elapsed_time": "0:55:07", "remaining_time": "0:10:05", "throughput": 5657.47, "total_tokens": 18713576} {"current_steps": 28675, "total_steps": 33920, "loss": 0.3325, "lr": 7.110924448310813e-07, "epoch": 16.90742924528302, "percentage": 84.54, "elapsed_time": "0:55:08", "remaining_time": "0:10:05", "throughput": 5657.45, "total_tokens": 18716232} {"current_steps": 28680, "total_steps": 33920, "loss": 0.2167, "lr": 7.097706003533666e-07, "epoch": 16.910377358490567, "percentage": 84.55, "elapsed_time": "0:55:08", "remaining_time": "0:10:04", "throughput": 5657.52, "total_tokens": 18719432} {"current_steps": 28685, "total_steps": 33920, "loss": 0.3636, "lr": 7.084498917323751e-07, "epoch": 16.913325471698112, "percentage": 84.57, "elapsed_time": "0:55:09", "remaining_time": "0:10:03", "throughput": 5657.62, "total_tokens": 18722664} {"current_steps": 28690, "total_steps": 33920, "loss": 0.3266, "lr": 7.071303193177698e-07, "epoch": 16.91627358490566, "percentage": 84.58, "elapsed_time": "0:55:09", "remaining_time": "0:10:03", "throughput": 5657.71, "total_tokens": 18725992} {"current_steps": 28695, "total_steps": 33920, "loss": 0.3559, "lr": 7.058118834589133e-07, "epoch": 16.91922169811321, "percentage": 84.6, "elapsed_time": "0:55:10", "remaining_time": "0:10:02", "throughput": 5657.56, "total_tokens": 18728520} {"current_steps": 28700, "total_steps": 33920, "loss": 0.3259, "lr": 7.044945845048684e-07, "epoch": 16.922169811320753, "percentage": 84.61, "elapsed_time": "0:55:10", "remaining_time": "0:10:02", "throughput": 5657.67, "total_tokens": 18732168} {"current_steps": 28705, "total_steps": 33920, "loss": 0.2902, "lr": 7.031784228043948e-07, "epoch": 16.9251179245283, "percentage": 84.63, "elapsed_time": "0:55:11", "remaining_time": "0:10:01", "throughput": 5657.81, "total_tokens": 18736264} {"current_steps": 28710, "total_steps": 33920, "loss": 0.2599, "lr": 7.01863398705952e-07, "epoch": 16.92806603773585, "percentage": 84.64, "elapsed_time": "0:55:12", "remaining_time": "0:10:01", "throughput": 5657.79, "total_tokens": 18739144} {"current_steps": 28715, "total_steps": 33920, "loss": 0.3527, "lr": 7.005495125576983e-07, "epoch": 16.931014150943398, "percentage": 84.66, "elapsed_time": "0:55:12", "remaining_time": "0:10:00", "throughput": 5658.07, "total_tokens": 18745096} {"current_steps": 28720, "total_steps": 33920, "loss": 0.2285, "lr": 6.99236764707491e-07, "epoch": 16.933962264150942, "percentage": 84.67, "elapsed_time": "0:55:13", "remaining_time": "0:09:59", "throughput": 5657.93, "total_tokens": 18747432} {"current_steps": 28725, "total_steps": 33920, "loss": 0.2431, "lr": 6.979251555028843e-07, "epoch": 16.93691037735849, "percentage": 84.68, "elapsed_time": "0:55:14", "remaining_time": "0:09:59", "throughput": 5658.03, "total_tokens": 18751080} {"current_steps": 28730, "total_steps": 33920, "loss": 0.2945, "lr": 6.966146852911332e-07, "epoch": 16.93985849056604, "percentage": 84.7, "elapsed_time": "0:55:14", "remaining_time": "0:09:58", "throughput": 5657.96, "total_tokens": 18753672} {"current_steps": 28735, "total_steps": 33920, "loss": 0.2463, "lr": 6.953053544191923e-07, "epoch": 16.942806603773583, "percentage": 84.71, "elapsed_time": "0:55:15", "remaining_time": "0:09:58", "throughput": 5657.97, "total_tokens": 18757032} {"current_steps": 28740, "total_steps": 33920, "loss": 0.3649, "lr": 6.939971632337111e-07, "epoch": 16.94575471698113, "percentage": 84.73, "elapsed_time": "0:55:15", "remaining_time": "0:09:57", "throughput": 5658.06, "total_tokens": 18760744} {"current_steps": 28745, "total_steps": 33920, "loss": 0.3169, "lr": 6.926901120810387e-07, "epoch": 16.94870283018868, "percentage": 84.74, "elapsed_time": "0:55:16", "remaining_time": "0:09:57", "throughput": 5658.16, "total_tokens": 18764072} {"current_steps": 28750, "total_steps": 33920, "loss": 0.2927, "lr": 6.91384201307222e-07, "epoch": 16.951650943396228, "percentage": 84.76, "elapsed_time": "0:55:16", "remaining_time": "0:09:56", "throughput": 5658.28, "total_tokens": 18767496} {"current_steps": 28755, "total_steps": 33920, "loss": 0.4488, "lr": 6.900794312580078e-07, "epoch": 16.954599056603772, "percentage": 84.77, "elapsed_time": "0:55:17", "remaining_time": "0:09:55", "throughput": 5658.38, "total_tokens": 18771240} {"current_steps": 28760, "total_steps": 33920, "loss": 0.2602, "lr": 6.887758022788377e-07, "epoch": 16.95754716981132, "percentage": 84.79, "elapsed_time": "0:55:17", "remaining_time": "0:09:55", "throughput": 5658.38, "total_tokens": 18774312} {"current_steps": 28765, "total_steps": 33920, "loss": 0.2412, "lr": 6.874733147148549e-07, "epoch": 16.96049528301887, "percentage": 84.8, "elapsed_time": "0:55:18", "remaining_time": "0:09:54", "throughput": 5658.62, "total_tokens": 18779272} {"current_steps": 28770, "total_steps": 33920, "loss": 0.311, "lr": 6.861719689108987e-07, "epoch": 16.963443396226417, "percentage": 84.82, "elapsed_time": "0:55:19", "remaining_time": "0:09:54", "throughput": 5658.67, "total_tokens": 18782408} {"current_steps": 28775, "total_steps": 33920, "loss": 0.3793, "lr": 6.84871765211505e-07, "epoch": 16.96639150943396, "percentage": 84.83, "elapsed_time": "0:55:19", "remaining_time": "0:09:53", "throughput": 5658.63, "total_tokens": 18785096} {"current_steps": 28780, "total_steps": 33920, "loss": 0.3615, "lr": 6.835727039609086e-07, "epoch": 16.96933962264151, "percentage": 84.85, "elapsed_time": "0:55:20", "remaining_time": "0:09:52", "throughput": 5658.77, "total_tokens": 18788680} {"current_steps": 28785, "total_steps": 33920, "loss": 0.38, "lr": 6.822747855030415e-07, "epoch": 16.972287735849058, "percentage": 84.86, "elapsed_time": "0:55:20", "remaining_time": "0:09:52", "throughput": 5658.73, "total_tokens": 18791592} {"current_steps": 28790, "total_steps": 33920, "loss": 0.4038, "lr": 6.809780101815322e-07, "epoch": 16.975235849056602, "percentage": 84.88, "elapsed_time": "0:55:21", "remaining_time": "0:09:51", "throughput": 5658.65, "total_tokens": 18794248} {"current_steps": 28795, "total_steps": 33920, "loss": 0.2689, "lr": 6.796823783397099e-07, "epoch": 16.97818396226415, "percentage": 84.89, "elapsed_time": "0:55:21", "remaining_time": "0:09:51", "throughput": 5658.6, "total_tokens": 18797032} {"current_steps": 28800, "total_steps": 33920, "loss": 0.3077, "lr": 6.783878903205976e-07, "epoch": 16.9811320754717, "percentage": 84.91, "elapsed_time": "0:55:22", "remaining_time": "0:09:50", "throughput": 5658.61, "total_tokens": 18800552} {"current_steps": 28805, "total_steps": 33920, "loss": 0.3135, "lr": 6.77094546466916e-07, "epoch": 16.984080188679247, "percentage": 84.92, "elapsed_time": "0:55:22", "remaining_time": "0:09:50", "throughput": 5658.61, "total_tokens": 18803304} {"current_steps": 28810, "total_steps": 33920, "loss": 0.2349, "lr": 6.758023471210845e-07, "epoch": 16.98702830188679, "percentage": 84.94, "elapsed_time": "0:55:23", "remaining_time": "0:09:49", "throughput": 5658.62, "total_tokens": 18806440} {"current_steps": 28815, "total_steps": 33920, "loss": 0.3146, "lr": 6.745112926252162e-07, "epoch": 16.98997641509434, "percentage": 84.95, "elapsed_time": "0:55:24", "remaining_time": "0:09:48", "throughput": 5658.69, "total_tokens": 18809512} {"current_steps": 28820, "total_steps": 33920, "loss": 0.3026, "lr": 6.732213833211265e-07, "epoch": 16.992924528301888, "percentage": 84.96, "elapsed_time": "0:55:24", "remaining_time": "0:09:48", "throughput": 5658.83, "total_tokens": 18813544} {"current_steps": 28825, "total_steps": 33920, "loss": 0.3043, "lr": 6.719326195503218e-07, "epoch": 16.995872641509433, "percentage": 84.98, "elapsed_time": "0:55:25", "remaining_time": "0:09:47", "throughput": 5658.78, "total_tokens": 18816200} {"current_steps": 28830, "total_steps": 33920, "loss": 0.3289, "lr": 6.706450016540094e-07, "epoch": 16.99882075471698, "percentage": 84.99, "elapsed_time": "0:55:25", "remaining_time": "0:09:47", "throughput": 5658.52, "total_tokens": 18818120} {"current_steps": 28835, "total_steps": 33920, "loss": 0.4684, "lr": 6.69358529973092e-07, "epoch": 17.00176886792453, "percentage": 85.01, "elapsed_time": "0:55:26", "remaining_time": "0:09:46", "throughput": 5657.83, "total_tokens": 18820560} {"current_steps": 28840, "total_steps": 33920, "loss": 0.2389, "lr": 6.680732048481681e-07, "epoch": 17.004716981132077, "percentage": 85.02, "elapsed_time": "0:55:26", "remaining_time": "0:09:46", "throughput": 5657.83, "total_tokens": 18823376} {"current_steps": 28845, "total_steps": 33920, "loss": 0.2828, "lr": 6.667890266195321e-07, "epoch": 17.00766509433962, "percentage": 85.04, "elapsed_time": "0:55:27", "remaining_time": "0:09:45", "throughput": 5657.8, "total_tokens": 18826320} {"current_steps": 28850, "total_steps": 33920, "loss": 0.4073, "lr": 6.655059956271759e-07, "epoch": 17.01061320754717, "percentage": 85.05, "elapsed_time": "0:55:28", "remaining_time": "0:09:44", "throughput": 5657.77, "total_tokens": 18829392} {"current_steps": 28855, "total_steps": 33920, "loss": 0.2946, "lr": 6.642241122107884e-07, "epoch": 17.013561320754718, "percentage": 85.07, "elapsed_time": "0:55:28", "remaining_time": "0:09:44", "throughput": 5657.78, "total_tokens": 18832880} {"current_steps": 28860, "total_steps": 33920, "loss": 0.4036, "lr": 6.629433767097537e-07, "epoch": 17.016509433962263, "percentage": 85.08, "elapsed_time": "0:55:29", "remaining_time": "0:09:43", "throughput": 5657.75, "total_tokens": 18835600} {"current_steps": 28865, "total_steps": 33920, "loss": 0.2604, "lr": 6.616637894631517e-07, "epoch": 17.01945754716981, "percentage": 85.1, "elapsed_time": "0:55:29", "remaining_time": "0:09:43", "throughput": 5657.73, "total_tokens": 18838384} {"current_steps": 28870, "total_steps": 33920, "loss": 0.3213, "lr": 6.603853508097591e-07, "epoch": 17.02240566037736, "percentage": 85.11, "elapsed_time": "0:55:30", "remaining_time": "0:09:42", "throughput": 5657.69, "total_tokens": 18841360} {"current_steps": 28875, "total_steps": 33920, "loss": 0.2987, "lr": 6.591080610880468e-07, "epoch": 17.025353773584907, "percentage": 85.13, "elapsed_time": "0:55:30", "remaining_time": "0:09:41", "throughput": 5657.71, "total_tokens": 18844464} {"current_steps": 28880, "total_steps": 33920, "loss": 0.2957, "lr": 6.578319206361828e-07, "epoch": 17.028301886792452, "percentage": 85.14, "elapsed_time": "0:55:31", "remaining_time": "0:09:41", "throughput": 5657.79, "total_tokens": 18847632} {"current_steps": 28885, "total_steps": 33920, "loss": 0.2527, "lr": 6.565569297920327e-07, "epoch": 17.03125, "percentage": 85.16, "elapsed_time": "0:55:31", "remaining_time": "0:09:40", "throughput": 5657.83, "total_tokens": 18850832} {"current_steps": 28890, "total_steps": 33920, "loss": 0.3308, "lr": 6.552830888931544e-07, "epoch": 17.034198113207548, "percentage": 85.17, "elapsed_time": "0:55:32", "remaining_time": "0:09:40", "throughput": 5657.97, "total_tokens": 18855088} {"current_steps": 28895, "total_steps": 33920, "loss": 0.3567, "lr": 6.540103982768031e-07, "epoch": 17.037146226415093, "percentage": 85.19, "elapsed_time": "0:55:33", "remaining_time": "0:09:39", "throughput": 5658.15, "total_tokens": 18859024} {"current_steps": 28900, "total_steps": 33920, "loss": 0.3168, "lr": 6.527388582799293e-07, "epoch": 17.04009433962264, "percentage": 85.2, "elapsed_time": "0:55:33", "remaining_time": "0:09:39", "throughput": 5658.3, "total_tokens": 18862768} {"current_steps": 28905, "total_steps": 33920, "loss": 0.336, "lr": 6.514684692391782e-07, "epoch": 17.04304245283019, "percentage": 85.22, "elapsed_time": "0:55:34", "remaining_time": "0:09:38", "throughput": 5658.4, "total_tokens": 18866448} {"current_steps": 28910, "total_steps": 33920, "loss": 0.28, "lr": 6.501992314908895e-07, "epoch": 17.045990566037737, "percentage": 85.23, "elapsed_time": "0:55:34", "remaining_time": "0:09:37", "throughput": 5658.34, "total_tokens": 18869200} {"current_steps": 28915, "total_steps": 33920, "loss": 0.2487, "lr": 6.489311453711017e-07, "epoch": 17.048938679245282, "percentage": 85.24, "elapsed_time": "0:55:35", "remaining_time": "0:09:37", "throughput": 5658.25, "total_tokens": 18871792} {"current_steps": 28920, "total_steps": 33920, "loss": 0.3703, "lr": 6.476642112155457e-07, "epoch": 17.05188679245283, "percentage": 85.26, "elapsed_time": "0:55:35", "remaining_time": "0:09:36", "throughput": 5658.46, "total_tokens": 18875824} {"current_steps": 28925, "total_steps": 33920, "loss": 0.3144, "lr": 6.463984293596476e-07, "epoch": 17.05483490566038, "percentage": 85.27, "elapsed_time": "0:55:36", "remaining_time": "0:09:36", "throughput": 5658.4, "total_tokens": 18878384} {"current_steps": 28930, "total_steps": 33920, "loss": 0.2724, "lr": 6.451338001385282e-07, "epoch": 17.057783018867923, "percentage": 85.29, "elapsed_time": "0:55:36", "remaining_time": "0:09:35", "throughput": 5658.37, "total_tokens": 18881584} {"current_steps": 28935, "total_steps": 33920, "loss": 0.3482, "lr": 6.438703238870037e-07, "epoch": 17.06073113207547, "percentage": 85.3, "elapsed_time": "0:55:37", "remaining_time": "0:09:35", "throughput": 5658.59, "total_tokens": 18885808} {"current_steps": 28940, "total_steps": 33920, "loss": 0.2442, "lr": 6.426080009395846e-07, "epoch": 17.06367924528302, "percentage": 85.32, "elapsed_time": "0:55:38", "remaining_time": "0:09:34", "throughput": 5658.6, "total_tokens": 18889680} {"current_steps": 28945, "total_steps": 33920, "loss": 0.3201, "lr": 6.413468316304755e-07, "epoch": 17.066627358490567, "percentage": 85.33, "elapsed_time": "0:55:38", "remaining_time": "0:09:33", "throughput": 5658.67, "total_tokens": 18893200} {"current_steps": 28950, "total_steps": 33920, "loss": 0.298, "lr": 6.400868162935786e-07, "epoch": 17.069575471698112, "percentage": 85.35, "elapsed_time": "0:55:39", "remaining_time": "0:09:33", "throughput": 5658.73, "total_tokens": 18896496} {"current_steps": 28955, "total_steps": 33920, "loss": 0.3733, "lr": 6.388279552624877e-07, "epoch": 17.07252358490566, "percentage": 85.36, "elapsed_time": "0:55:39", "remaining_time": "0:09:32", "throughput": 5658.88, "total_tokens": 18900528} {"current_steps": 28960, "total_steps": 33920, "loss": 0.3959, "lr": 6.37570248870491e-07, "epoch": 17.07547169811321, "percentage": 85.38, "elapsed_time": "0:55:40", "remaining_time": "0:09:32", "throughput": 5658.9, "total_tokens": 18903664} {"current_steps": 28965, "total_steps": 33920, "loss": 0.2677, "lr": 6.363136974505718e-07, "epoch": 17.078419811320753, "percentage": 85.39, "elapsed_time": "0:55:41", "remaining_time": "0:09:31", "throughput": 5658.98, "total_tokens": 18907216} {"current_steps": 28970, "total_steps": 33920, "loss": 0.3265, "lr": 6.350583013354078e-07, "epoch": 17.0813679245283, "percentage": 85.41, "elapsed_time": "0:55:41", "remaining_time": "0:09:30", "throughput": 5659.14, "total_tokens": 18910992} {"current_steps": 28975, "total_steps": 33920, "loss": 0.3975, "lr": 6.338040608573693e-07, "epoch": 17.08431603773585, "percentage": 85.42, "elapsed_time": "0:55:42", "remaining_time": "0:09:30", "throughput": 5659.31, "total_tokens": 18914736} {"current_steps": 28980, "total_steps": 33920, "loss": 0.4356, "lr": 6.325509763485238e-07, "epoch": 17.087264150943398, "percentage": 85.44, "elapsed_time": "0:55:42", "remaining_time": "0:09:29", "throughput": 5659.3, "total_tokens": 18917680} {"current_steps": 28985, "total_steps": 33920, "loss": 0.422, "lr": 6.312990481406301e-07, "epoch": 17.090212264150942, "percentage": 85.45, "elapsed_time": "0:55:43", "remaining_time": "0:09:29", "throughput": 5659.36, "total_tokens": 18921104} {"current_steps": 28990, "total_steps": 33920, "loss": 0.3194, "lr": 6.300482765651411e-07, "epoch": 17.09316037735849, "percentage": 85.47, "elapsed_time": "0:55:43", "remaining_time": "0:09:28", "throughput": 5659.29, "total_tokens": 18923632} {"current_steps": 28995, "total_steps": 33920, "loss": 0.3847, "lr": 6.28798661953205e-07, "epoch": 17.09610849056604, "percentage": 85.48, "elapsed_time": "0:55:44", "remaining_time": "0:09:28", "throughput": 5659.42, "total_tokens": 18927440} {"current_steps": 29000, "total_steps": 33920, "loss": 0.3914, "lr": 6.275502046356618e-07, "epoch": 17.099056603773583, "percentage": 85.5, "elapsed_time": "0:55:44", "remaining_time": "0:09:27", "throughput": 5659.5, "total_tokens": 18930896} {"current_steps": 29005, "total_steps": 33920, "loss": 0.4015, "lr": 6.263029049430447e-07, "epoch": 17.10200471698113, "percentage": 85.51, "elapsed_time": "0:55:45", "remaining_time": "0:09:26", "throughput": 5659.37, "total_tokens": 18933680} {"current_steps": 29010, "total_steps": 33920, "loss": 0.2719, "lr": 6.250567632055832e-07, "epoch": 17.10495283018868, "percentage": 85.52, "elapsed_time": "0:55:46", "remaining_time": "0:09:26", "throughput": 5659.48, "total_tokens": 18937200} {"current_steps": 29015, "total_steps": 33920, "loss": 0.2425, "lr": 6.238117797532e-07, "epoch": 17.107900943396228, "percentage": 85.54, "elapsed_time": "0:55:46", "remaining_time": "0:09:25", "throughput": 5659.58, "total_tokens": 18940976} {"current_steps": 29020, "total_steps": 33920, "loss": 0.2221, "lr": 6.225679549155083e-07, "epoch": 17.110849056603772, "percentage": 85.55, "elapsed_time": "0:55:47", "remaining_time": "0:09:25", "throughput": 5659.5, "total_tokens": 18943472} {"current_steps": 29025, "total_steps": 33920, "loss": 0.4864, "lr": 6.213252890218163e-07, "epoch": 17.11379716981132, "percentage": 85.57, "elapsed_time": "0:55:47", "remaining_time": "0:09:24", "throughput": 5659.59, "total_tokens": 18946608} {"current_steps": 29030, "total_steps": 33920, "loss": 0.2447, "lr": 6.200837824011247e-07, "epoch": 17.11674528301887, "percentage": 85.58, "elapsed_time": "0:55:48", "remaining_time": "0:09:23", "throughput": 5659.53, "total_tokens": 18949232} {"current_steps": 29035, "total_steps": 33920, "loss": 0.283, "lr": 6.188434353821282e-07, "epoch": 17.119693396226417, "percentage": 85.6, "elapsed_time": "0:55:48", "remaining_time": "0:09:23", "throughput": 5659.69, "total_tokens": 18953040} {"current_steps": 29040, "total_steps": 33920, "loss": 0.3229, "lr": 6.176042482932132e-07, "epoch": 17.12264150943396, "percentage": 85.61, "elapsed_time": "0:55:49", "remaining_time": "0:09:22", "throughput": 5659.72, "total_tokens": 18956144} {"current_steps": 29045, "total_steps": 33920, "loss": 0.3138, "lr": 6.163662214624616e-07, "epoch": 17.12558962264151, "percentage": 85.63, "elapsed_time": "0:55:49", "remaining_time": "0:09:22", "throughput": 5659.68, "total_tokens": 18959312} {"current_steps": 29050, "total_steps": 33920, "loss": 0.29, "lr": 6.151293552176451e-07, "epoch": 17.128537735849058, "percentage": 85.64, "elapsed_time": "0:55:50", "remaining_time": "0:09:21", "throughput": 5659.66, "total_tokens": 18962384} {"current_steps": 29055, "total_steps": 33920, "loss": 0.3089, "lr": 6.138936498862291e-07, "epoch": 17.131485849056602, "percentage": 85.66, "elapsed_time": "0:55:51", "remaining_time": "0:09:21", "throughput": 5659.74, "total_tokens": 18965936} {"current_steps": 29060, "total_steps": 33920, "loss": 0.3179, "lr": 6.126591057953729e-07, "epoch": 17.13443396226415, "percentage": 85.67, "elapsed_time": "0:55:51", "remaining_time": "0:09:20", "throughput": 5659.82, "total_tokens": 18969488} {"current_steps": 29065, "total_steps": 33920, "loss": 0.2565, "lr": 6.114257232719267e-07, "epoch": 17.1373820754717, "percentage": 85.69, "elapsed_time": "0:55:52", "remaining_time": "0:09:19", "throughput": 5659.67, "total_tokens": 18971792} {"current_steps": 29070, "total_steps": 33920, "loss": 0.411, "lr": 6.101935026424332e-07, "epoch": 17.140330188679247, "percentage": 85.7, "elapsed_time": "0:55:52", "remaining_time": "0:09:19", "throughput": 5659.77, "total_tokens": 18975312} {"current_steps": 29075, "total_steps": 33920, "loss": 0.3314, "lr": 6.089624442331293e-07, "epoch": 17.14327830188679, "percentage": 85.72, "elapsed_time": "0:55:53", "remaining_time": "0:09:18", "throughput": 5659.71, "total_tokens": 18977968} {"current_steps": 29080, "total_steps": 33920, "loss": 0.296, "lr": 6.077325483699432e-07, "epoch": 17.14622641509434, "percentage": 85.73, "elapsed_time": "0:55:53", "remaining_time": "0:09:18", "throughput": 5659.57, "total_tokens": 18980432} {"current_steps": 29085, "total_steps": 33920, "loss": 0.237, "lr": 6.065038153784947e-07, "epoch": 17.149174528301888, "percentage": 85.75, "elapsed_time": "0:55:54", "remaining_time": "0:09:17", "throughput": 5659.58, "total_tokens": 18983216} {"current_steps": 29090, "total_steps": 33920, "loss": 0.2683, "lr": 6.052762455840955e-07, "epoch": 17.152122641509433, "percentage": 85.76, "elapsed_time": "0:55:54", "remaining_time": "0:09:17", "throughput": 5659.7, "total_tokens": 18986672} {"current_steps": 29095, "total_steps": 33920, "loss": 0.2812, "lr": 6.040498393117494e-07, "epoch": 17.15507075471698, "percentage": 85.78, "elapsed_time": "0:55:55", "remaining_time": "0:09:16", "throughput": 5659.76, "total_tokens": 18990000} {"current_steps": 29100, "total_steps": 33920, "loss": 0.2802, "lr": 6.028245968861551e-07, "epoch": 17.15801886792453, "percentage": 85.79, "elapsed_time": "0:55:55", "remaining_time": "0:09:15", "throughput": 5659.9, "total_tokens": 18994000} {"current_steps": 29105, "total_steps": 33920, "loss": 0.3364, "lr": 6.016005186316987e-07, "epoch": 17.160966981132077, "percentage": 85.8, "elapsed_time": "0:55:56", "remaining_time": "0:09:15", "throughput": 5659.95, "total_tokens": 18997136} {"current_steps": 29110, "total_steps": 33920, "loss": 0.3032, "lr": 6.003776048724614e-07, "epoch": 17.16391509433962, "percentage": 85.82, "elapsed_time": "0:55:56", "remaining_time": "0:09:14", "throughput": 5659.91, "total_tokens": 19000208} {"current_steps": 29115, "total_steps": 33920, "loss": 0.246, "lr": 5.991558559322152e-07, "epoch": 17.16686320754717, "percentage": 85.83, "elapsed_time": "0:55:57", "remaining_time": "0:09:14", "throughput": 5659.75, "total_tokens": 19002736} {"current_steps": 29120, "total_steps": 33920, "loss": 0.3158, "lr": 5.979352721344223e-07, "epoch": 17.169811320754718, "percentage": 85.85, "elapsed_time": "0:55:58", "remaining_time": "0:09:13", "throughput": 5659.87, "total_tokens": 19006480} {"current_steps": 29125, "total_steps": 33920, "loss": 0.2779, "lr": 5.967158538022383e-07, "epoch": 17.172759433962263, "percentage": 85.86, "elapsed_time": "0:55:58", "remaining_time": "0:09:12", "throughput": 5660.01, "total_tokens": 19010416} {"current_steps": 29130, "total_steps": 33920, "loss": 0.2406, "lr": 5.954976012585078e-07, "epoch": 17.17570754716981, "percentage": 85.88, "elapsed_time": "0:55:59", "remaining_time": "0:09:12", "throughput": 5660.0, "total_tokens": 19013552} {"current_steps": 29135, "total_steps": 33920, "loss": 0.2935, "lr": 5.942805148257713e-07, "epoch": 17.17865566037736, "percentage": 85.89, "elapsed_time": "0:55:59", "remaining_time": "0:09:11", "throughput": 5660.19, "total_tokens": 19017328} {"current_steps": 29140, "total_steps": 33920, "loss": 0.4511, "lr": 5.930645948262553e-07, "epoch": 17.181603773584907, "percentage": 85.91, "elapsed_time": "0:56:00", "remaining_time": "0:09:11", "throughput": 5660.27, "total_tokens": 19020816} {"current_steps": 29145, "total_steps": 33920, "loss": 0.2451, "lr": 5.918498415818813e-07, "epoch": 17.184551886792452, "percentage": 85.92, "elapsed_time": "0:56:00", "remaining_time": "0:09:10", "throughput": 5660.23, "total_tokens": 19023408} {"current_steps": 29150, "total_steps": 33920, "loss": 0.271, "lr": 5.906362554142592e-07, "epoch": 17.1875, "percentage": 85.94, "elapsed_time": "0:56:01", "remaining_time": "0:09:10", "throughput": 5660.25, "total_tokens": 19026416} {"current_steps": 29155, "total_steps": 33920, "loss": 0.2569, "lr": 5.894238366446925e-07, "epoch": 17.190448113207548, "percentage": 85.95, "elapsed_time": "0:56:01", "remaining_time": "0:09:09", "throughput": 5660.25, "total_tokens": 19029168} {"current_steps": 29160, "total_steps": 33920, "loss": 0.2518, "lr": 5.882125855941723e-07, "epoch": 17.193396226415093, "percentage": 85.97, "elapsed_time": "0:56:02", "remaining_time": "0:09:08", "throughput": 5660.31, "total_tokens": 19032912} {"current_steps": 29165, "total_steps": 33920, "loss": 0.3503, "lr": 5.870025025833842e-07, "epoch": 17.19634433962264, "percentage": 85.98, "elapsed_time": "0:56:03", "remaining_time": "0:09:08", "throughput": 5660.18, "total_tokens": 19035472} {"current_steps": 29170, "total_steps": 33920, "loss": 0.2846, "lr": 5.857935879327031e-07, "epoch": 17.19929245283019, "percentage": 86.0, "elapsed_time": "0:56:03", "remaining_time": "0:09:07", "throughput": 5660.3, "total_tokens": 19039408} {"current_steps": 29175, "total_steps": 33920, "loss": 0.298, "lr": 5.845858419621936e-07, "epoch": 17.202240566037737, "percentage": 86.01, "elapsed_time": "0:56:04", "remaining_time": "0:09:07", "throughput": 5660.31, "total_tokens": 19042384} {"current_steps": 29180, "total_steps": 33920, "loss": 0.3781, "lr": 5.83379264991612e-07, "epoch": 17.205188679245282, "percentage": 86.03, "elapsed_time": "0:56:04", "remaining_time": "0:09:06", "throughput": 5660.38, "total_tokens": 19045648} {"current_steps": 29185, "total_steps": 33920, "loss": 0.4946, "lr": 5.821738573404046e-07, "epoch": 17.20813679245283, "percentage": 86.04, "elapsed_time": "0:56:05", "remaining_time": "0:09:05", "throughput": 5660.45, "total_tokens": 19049136} {"current_steps": 29190, "total_steps": 33920, "loss": 0.2932, "lr": 5.80969619327707e-07, "epoch": 17.21108490566038, "percentage": 86.06, "elapsed_time": "0:56:05", "remaining_time": "0:09:05", "throughput": 5660.39, "total_tokens": 19051728} {"current_steps": 29195, "total_steps": 33920, "loss": 0.2857, "lr": 5.797665512723488e-07, "epoch": 17.214033018867923, "percentage": 86.07, "elapsed_time": "0:56:06", "remaining_time": "0:09:04", "throughput": 5660.56, "total_tokens": 19055728} {"current_steps": 29200, "total_steps": 33920, "loss": 0.3064, "lr": 5.785646534928452e-07, "epoch": 17.21698113207547, "percentage": 86.08, "elapsed_time": "0:56:06", "remaining_time": "0:09:04", "throughput": 5660.62, "total_tokens": 19058832} {"current_steps": 29205, "total_steps": 33920, "loss": 0.2681, "lr": 5.77363926307406e-07, "epoch": 17.21992924528302, "percentage": 86.1, "elapsed_time": "0:56:07", "remaining_time": "0:09:03", "throughput": 5660.77, "total_tokens": 19062608} {"current_steps": 29210, "total_steps": 33920, "loss": 0.297, "lr": 5.761643700339281e-07, "epoch": 17.222877358490567, "percentage": 86.11, "elapsed_time": "0:56:08", "remaining_time": "0:09:03", "throughput": 5660.87, "total_tokens": 19066320} {"current_steps": 29215, "total_steps": 33920, "loss": 0.3395, "lr": 5.749659849899985e-07, "epoch": 17.225825471698112, "percentage": 86.13, "elapsed_time": "0:56:08", "remaining_time": "0:09:02", "throughput": 5660.88, "total_tokens": 19069136} {"current_steps": 29220, "total_steps": 33920, "loss": 0.3699, "lr": 5.737687714928953e-07, "epoch": 17.22877358490566, "percentage": 86.14, "elapsed_time": "0:56:09", "remaining_time": "0:09:01", "throughput": 5660.95, "total_tokens": 19072496} {"current_steps": 29225, "total_steps": 33920, "loss": 0.3469, "lr": 5.725727298595846e-07, "epoch": 17.23172169811321, "percentage": 86.16, "elapsed_time": "0:56:09", "remaining_time": "0:09:01", "throughput": 5660.95, "total_tokens": 19075440} {"current_steps": 29230, "total_steps": 33920, "loss": 0.3471, "lr": 5.71377860406726e-07, "epoch": 17.234669811320753, "percentage": 86.17, "elapsed_time": "0:56:10", "remaining_time": "0:09:00", "throughput": 5661.14, "total_tokens": 19079728} {"current_steps": 29235, "total_steps": 33920, "loss": 0.3067, "lr": 5.701841634506655e-07, "epoch": 17.2376179245283, "percentage": 86.19, "elapsed_time": "0:56:10", "remaining_time": "0:09:00", "throughput": 5661.13, "total_tokens": 19082640} {"current_steps": 29240, "total_steps": 33920, "loss": 0.3328, "lr": 5.689916393074391e-07, "epoch": 17.24056603773585, "percentage": 86.2, "elapsed_time": "0:56:11", "remaining_time": "0:08:59", "throughput": 5661.07, "total_tokens": 19085456} {"current_steps": 29245, "total_steps": 33920, "loss": 0.4058, "lr": 5.678002882927725e-07, "epoch": 17.243514150943398, "percentage": 86.22, "elapsed_time": "0:56:11", "remaining_time": "0:08:59", "throughput": 5660.98, "total_tokens": 19088304} {"current_steps": 29250, "total_steps": 33920, "loss": 0.2134, "lr": 5.666101107220811e-07, "epoch": 17.246462264150942, "percentage": 86.23, "elapsed_time": "0:56:12", "remaining_time": "0:08:58", "throughput": 5660.83, "total_tokens": 19090672} {"current_steps": 29255, "total_steps": 33920, "loss": 0.2583, "lr": 5.654211069104693e-07, "epoch": 17.24941037735849, "percentage": 86.25, "elapsed_time": "0:56:13", "remaining_time": "0:08:57", "throughput": 5660.82, "total_tokens": 19094000} {"current_steps": 29260, "total_steps": 33920, "loss": 0.2633, "lr": 5.642332771727321e-07, "epoch": 17.25235849056604, "percentage": 86.26, "elapsed_time": "0:56:13", "remaining_time": "0:08:57", "throughput": 5660.89, "total_tokens": 19097040} {"current_steps": 29265, "total_steps": 33920, "loss": 0.4488, "lr": 5.630466218233521e-07, "epoch": 17.255306603773583, "percentage": 86.28, "elapsed_time": "0:56:14", "remaining_time": "0:08:56", "throughput": 5660.87, "total_tokens": 19099984} {"current_steps": 29270, "total_steps": 33920, "loss": 0.3237, "lr": 5.618611411765007e-07, "epoch": 17.25825471698113, "percentage": 86.29, "elapsed_time": "0:56:14", "remaining_time": "0:08:56", "throughput": 5660.76, "total_tokens": 19102576} {"current_steps": 29275, "total_steps": 33920, "loss": 0.2747, "lr": 5.606768355460401e-07, "epoch": 17.26120283018868, "percentage": 86.31, "elapsed_time": "0:56:15", "remaining_time": "0:08:55", "throughput": 5660.76, "total_tokens": 19105648} {"current_steps": 29280, "total_steps": 33920, "loss": 0.2793, "lr": 5.594937052455191e-07, "epoch": 17.264150943396228, "percentage": 86.32, "elapsed_time": "0:56:15", "remaining_time": "0:08:54", "throughput": 5660.73, "total_tokens": 19108432} {"current_steps": 29285, "total_steps": 33920, "loss": 0.2991, "lr": 5.583117505881764e-07, "epoch": 17.267099056603772, "percentage": 86.34, "elapsed_time": "0:56:16", "remaining_time": "0:08:54", "throughput": 5660.87, "total_tokens": 19112496} {"current_steps": 29290, "total_steps": 33920, "loss": 0.2687, "lr": 5.571309718869417e-07, "epoch": 17.27004716981132, "percentage": 86.35, "elapsed_time": "0:56:16", "remaining_time": "0:08:53", "throughput": 5660.98, "total_tokens": 19116528} {"current_steps": 29295, "total_steps": 33920, "loss": 0.2841, "lr": 5.559513694544282e-07, "epoch": 17.27299528301887, "percentage": 86.36, "elapsed_time": "0:56:17", "remaining_time": "0:08:53", "throughput": 5661.0, "total_tokens": 19119664} {"current_steps": 29300, "total_steps": 33920, "loss": 0.3022, "lr": 5.547729436029442e-07, "epoch": 17.275943396226417, "percentage": 86.38, "elapsed_time": "0:56:17", "remaining_time": "0:08:52", "throughput": 5660.94, "total_tokens": 19122320} {"current_steps": 29305, "total_steps": 33920, "loss": 0.3635, "lr": 5.535956946444809e-07, "epoch": 17.27889150943396, "percentage": 86.39, "elapsed_time": "0:56:18", "remaining_time": "0:08:52", "throughput": 5661.04, "total_tokens": 19126096} {"current_steps": 29310, "total_steps": 33920, "loss": 0.351, "lr": 5.524196228907203e-07, "epoch": 17.28183962264151, "percentage": 86.41, "elapsed_time": "0:56:19", "remaining_time": "0:08:51", "throughput": 5661.26, "total_tokens": 19130608} {"current_steps": 29315, "total_steps": 33920, "loss": 0.4131, "lr": 5.512447286530326e-07, "epoch": 17.284787735849058, "percentage": 86.42, "elapsed_time": "0:56:19", "remaining_time": "0:08:50", "throughput": 5661.46, "total_tokens": 19134832} {"current_steps": 29320, "total_steps": 33920, "loss": 0.334, "lr": 5.500710122424746e-07, "epoch": 17.287735849056602, "percentage": 86.44, "elapsed_time": "0:56:20", "remaining_time": "0:08:50", "throughput": 5661.51, "total_tokens": 19138064} {"current_steps": 29325, "total_steps": 33920, "loss": 0.2652, "lr": 5.488984739697961e-07, "epoch": 17.29068396226415, "percentage": 86.45, "elapsed_time": "0:56:20", "remaining_time": "0:08:49", "throughput": 5661.34, "total_tokens": 19140528} {"current_steps": 29330, "total_steps": 33920, "loss": 0.3746, "lr": 5.477271141454294e-07, "epoch": 17.2936320754717, "percentage": 86.47, "elapsed_time": "0:56:21", "remaining_time": "0:08:49", "throughput": 5661.36, "total_tokens": 19143600} {"current_steps": 29335, "total_steps": 33920, "loss": 0.251, "lr": 5.465569330794974e-07, "epoch": 17.296580188679247, "percentage": 86.48, "elapsed_time": "0:56:22", "remaining_time": "0:08:48", "throughput": 5661.4, "total_tokens": 19146960} {"current_steps": 29340, "total_steps": 33920, "loss": 0.3181, "lr": 5.453879310818105e-07, "epoch": 17.29952830188679, "percentage": 86.5, "elapsed_time": "0:56:22", "remaining_time": "0:08:48", "throughput": 5661.3, "total_tokens": 19149488} {"current_steps": 29345, "total_steps": 33920, "loss": 0.2449, "lr": 5.442201084618664e-07, "epoch": 17.30247641509434, "percentage": 86.51, "elapsed_time": "0:56:23", "remaining_time": "0:08:47", "throughput": 5661.2, "total_tokens": 19152464} {"current_steps": 29350, "total_steps": 33920, "loss": 0.2897, "lr": 5.430534655288528e-07, "epoch": 17.305424528301888, "percentage": 86.53, "elapsed_time": "0:56:23", "remaining_time": "0:08:46", "throughput": 5661.21, "total_tokens": 19155856} {"current_steps": 29355, "total_steps": 33920, "loss": 0.2634, "lr": 5.418880025916428e-07, "epoch": 17.308372641509433, "percentage": 86.54, "elapsed_time": "0:56:24", "remaining_time": "0:08:46", "throughput": 5661.18, "total_tokens": 19158704} {"current_steps": 29360, "total_steps": 33920, "loss": 0.2969, "lr": 5.407237199587973e-07, "epoch": 17.31132075471698, "percentage": 86.56, "elapsed_time": "0:56:24", "remaining_time": "0:08:45", "throughput": 5661.27, "total_tokens": 19162064} {"current_steps": 29365, "total_steps": 33920, "loss": 0.4221, "lr": 5.395606179385654e-07, "epoch": 17.31426886792453, "percentage": 86.57, "elapsed_time": "0:56:25", "remaining_time": "0:08:45", "throughput": 5661.39, "total_tokens": 19165968} {"current_steps": 29370, "total_steps": 33920, "loss": 0.2409, "lr": 5.383986968388833e-07, "epoch": 17.317216981132077, "percentage": 86.59, "elapsed_time": "0:56:25", "remaining_time": "0:08:44", "throughput": 5661.41, "total_tokens": 19169424} {"current_steps": 29375, "total_steps": 33920, "loss": 0.2774, "lr": 5.372379569673736e-07, "epoch": 17.32016509433962, "percentage": 86.6, "elapsed_time": "0:56:26", "remaining_time": "0:08:43", "throughput": 5661.29, "total_tokens": 19172176} {"current_steps": 29380, "total_steps": 33920, "loss": 0.2571, "lr": 5.360783986313495e-07, "epoch": 17.32311320754717, "percentage": 86.62, "elapsed_time": "0:56:27", "remaining_time": "0:08:43", "throughput": 5661.25, "total_tokens": 19175216} {"current_steps": 29385, "total_steps": 33920, "loss": 0.3781, "lr": 5.349200221378076e-07, "epoch": 17.326061320754718, "percentage": 86.63, "elapsed_time": "0:56:27", "remaining_time": "0:08:42", "throughput": 5661.17, "total_tokens": 19177744} {"current_steps": 29390, "total_steps": 33920, "loss": 0.2195, "lr": 5.33762827793432e-07, "epoch": 17.329009433962263, "percentage": 86.65, "elapsed_time": "0:56:28", "remaining_time": "0:08:42", "throughput": 5661.29, "total_tokens": 19181552} {"current_steps": 29395, "total_steps": 33920, "loss": 0.3001, "lr": 5.326068159045978e-07, "epoch": 17.33195754716981, "percentage": 86.66, "elapsed_time": "0:56:28", "remaining_time": "0:08:41", "throughput": 5661.24, "total_tokens": 19184272} {"current_steps": 29400, "total_steps": 33920, "loss": 0.2516, "lr": 5.314519867773621e-07, "epoch": 17.33490566037736, "percentage": 86.67, "elapsed_time": "0:56:29", "remaining_time": "0:08:41", "throughput": 5661.11, "total_tokens": 19186736} {"current_steps": 29405, "total_steps": 33920, "loss": 0.2914, "lr": 5.302983407174711e-07, "epoch": 17.337853773584907, "percentage": 86.69, "elapsed_time": "0:56:29", "remaining_time": "0:08:40", "throughput": 5661.22, "total_tokens": 19190032} {"current_steps": 29410, "total_steps": 33920, "loss": 0.3048, "lr": 5.291458780303572e-07, "epoch": 17.340801886792452, "percentage": 86.7, "elapsed_time": "0:56:30", "remaining_time": "0:08:39", "throughput": 5661.11, "total_tokens": 19192560} {"current_steps": 29415, "total_steps": 33920, "loss": 0.2656, "lr": 5.279945990211411e-07, "epoch": 17.34375, "percentage": 86.72, "elapsed_time": "0:56:30", "remaining_time": "0:08:39", "throughput": 5661.06, "total_tokens": 19195664} {"current_steps": 29420, "total_steps": 33920, "loss": 0.2001, "lr": 5.26844503994628e-07, "epoch": 17.346698113207548, "percentage": 86.73, "elapsed_time": "0:56:31", "remaining_time": "0:08:38", "throughput": 5661.06, "total_tokens": 19198512} {"current_steps": 29425, "total_steps": 33920, "loss": 0.2826, "lr": 5.25695593255311e-07, "epoch": 17.349646226415093, "percentage": 86.75, "elapsed_time": "0:56:31", "remaining_time": "0:08:38", "throughput": 5661.05, "total_tokens": 19201296} {"current_steps": 29430, "total_steps": 33920, "loss": 0.3581, "lr": 5.24547867107369e-07, "epoch": 17.35259433962264, "percentage": 86.76, "elapsed_time": "0:56:32", "remaining_time": "0:08:37", "throughput": 5661.06, "total_tokens": 19204496} {"current_steps": 29435, "total_steps": 33920, "loss": 0.352, "lr": 5.234013258546672e-07, "epoch": 17.35554245283019, "percentage": 86.78, "elapsed_time": "0:56:32", "remaining_time": "0:08:36", "throughput": 5661.04, "total_tokens": 19207280} {"current_steps": 29440, "total_steps": 33920, "loss": 0.3048, "lr": 5.222559698007563e-07, "epoch": 17.358490566037737, "percentage": 86.79, "elapsed_time": "0:56:33", "remaining_time": "0:08:36", "throughput": 5661.11, "total_tokens": 19210640} {"current_steps": 29445, "total_steps": 33920, "loss": 0.3254, "lr": 5.211117992488763e-07, "epoch": 17.361438679245282, "percentage": 86.81, "elapsed_time": "0:56:33", "remaining_time": "0:08:35", "throughput": 5661.08, "total_tokens": 19213680} {"current_steps": 29450, "total_steps": 33920, "loss": 0.3811, "lr": 5.199688145019505e-07, "epoch": 17.36438679245283, "percentage": 86.82, "elapsed_time": "0:56:34", "remaining_time": "0:08:35", "throughput": 5661.02, "total_tokens": 19216336} {"current_steps": 29455, "total_steps": 33920, "loss": 0.2949, "lr": 5.188270158625891e-07, "epoch": 17.36733490566038, "percentage": 86.84, "elapsed_time": "0:56:35", "remaining_time": "0:08:34", "throughput": 5661.12, "total_tokens": 19219600} {"current_steps": 29460, "total_steps": 33920, "loss": 0.4705, "lr": 5.176864036330875e-07, "epoch": 17.370283018867923, "percentage": 86.85, "elapsed_time": "0:56:35", "remaining_time": "0:08:34", "throughput": 5661.01, "total_tokens": 19222000} {"current_steps": 29465, "total_steps": 33920, "loss": 0.2213, "lr": 5.165469781154287e-07, "epoch": 17.37323113207547, "percentage": 86.87, "elapsed_time": "0:56:36", "remaining_time": "0:08:33", "throughput": 5661.18, "total_tokens": 19226320} {"current_steps": 29470, "total_steps": 33920, "loss": 0.2652, "lr": 5.154087396112789e-07, "epoch": 17.37617924528302, "percentage": 86.88, "elapsed_time": "0:56:36", "remaining_time": "0:08:32", "throughput": 5661.34, "total_tokens": 19230448} {"current_steps": 29475, "total_steps": 33920, "loss": 0.2501, "lr": 5.142716884219939e-07, "epoch": 17.379127358490567, "percentage": 86.9, "elapsed_time": "0:56:37", "remaining_time": "0:08:32", "throughput": 5661.36, "total_tokens": 19233392} {"current_steps": 29480, "total_steps": 33920, "loss": 0.2874, "lr": 5.131358248486118e-07, "epoch": 17.382075471698112, "percentage": 86.91, "elapsed_time": "0:56:37", "remaining_time": "0:08:31", "throughput": 5661.35, "total_tokens": 19236432} {"current_steps": 29485, "total_steps": 33920, "loss": 0.2896, "lr": 5.120011491918564e-07, "epoch": 17.38502358490566, "percentage": 86.93, "elapsed_time": "0:56:38", "remaining_time": "0:08:31", "throughput": 5661.49, "total_tokens": 19240496} {"current_steps": 29490, "total_steps": 33920, "loss": 0.338, "lr": 5.108676617521402e-07, "epoch": 17.38797169811321, "percentage": 86.94, "elapsed_time": "0:56:39", "remaining_time": "0:08:30", "throughput": 5661.35, "total_tokens": 19242960} {"current_steps": 29495, "total_steps": 33920, "loss": 0.3103, "lr": 5.097353628295571e-07, "epoch": 17.390919811320753, "percentage": 86.95, "elapsed_time": "0:56:39", "remaining_time": "0:08:30", "throughput": 5661.39, "total_tokens": 19246032} {"current_steps": 29500, "total_steps": 33920, "loss": 0.3332, "lr": 5.086042527238893e-07, "epoch": 17.3938679245283, "percentage": 86.97, "elapsed_time": "0:56:40", "remaining_time": "0:08:29", "throughput": 5661.39, "total_tokens": 19249488} {"current_steps": 29505, "total_steps": 33920, "loss": 0.3523, "lr": 5.074743317346009e-07, "epoch": 17.39681603773585, "percentage": 86.98, "elapsed_time": "0:56:40", "remaining_time": "0:08:28", "throughput": 5661.36, "total_tokens": 19252784} {"current_steps": 29510, "total_steps": 33920, "loss": 0.5155, "lr": 5.063456001608458e-07, "epoch": 17.399764150943398, "percentage": 87.0, "elapsed_time": "0:56:41", "remaining_time": "0:08:28", "throughput": 5661.41, "total_tokens": 19256080} {"current_steps": 29515, "total_steps": 33920, "loss": 0.2626, "lr": 5.052180583014599e-07, "epoch": 17.402712264150942, "percentage": 87.01, "elapsed_time": "0:56:41", "remaining_time": "0:08:27", "throughput": 5661.37, "total_tokens": 19258736} {"current_steps": 29520, "total_steps": 33920, "loss": 0.2374, "lr": 5.04091706454965e-07, "epoch": 17.40566037735849, "percentage": 87.03, "elapsed_time": "0:56:42", "remaining_time": "0:08:27", "throughput": 5661.18, "total_tokens": 19261072} {"current_steps": 29525, "total_steps": 33920, "loss": 0.326, "lr": 5.029665449195665e-07, "epoch": 17.40860849056604, "percentage": 87.04, "elapsed_time": "0:56:42", "remaining_time": "0:08:26", "throughput": 5661.13, "total_tokens": 19263632} {"current_steps": 29530, "total_steps": 33920, "loss": 0.2177, "lr": 5.018425739931559e-07, "epoch": 17.411556603773583, "percentage": 87.06, "elapsed_time": "0:56:43", "remaining_time": "0:08:25", "throughput": 5661.05, "total_tokens": 19266320} {"current_steps": 29535, "total_steps": 33920, "loss": 0.2709, "lr": 5.007197939733099e-07, "epoch": 17.41450471698113, "percentage": 87.07, "elapsed_time": "0:56:43", "remaining_time": "0:08:25", "throughput": 5661.18, "total_tokens": 19270320} {"current_steps": 29540, "total_steps": 33920, "loss": 0.2668, "lr": 4.995982051572895e-07, "epoch": 17.41745283018868, "percentage": 87.09, "elapsed_time": "0:56:44", "remaining_time": "0:08:24", "throughput": 5661.3, "total_tokens": 19274032} {"current_steps": 29545, "total_steps": 33920, "loss": 0.2502, "lr": 4.984778078420405e-07, "epoch": 17.420400943396228, "percentage": 87.1, "elapsed_time": "0:56:45", "remaining_time": "0:08:24", "throughput": 5661.38, "total_tokens": 19277520} {"current_steps": 29550, "total_steps": 33920, "loss": 0.3827, "lr": 4.973586023241917e-07, "epoch": 17.423349056603772, "percentage": 87.12, "elapsed_time": "0:56:45", "remaining_time": "0:08:23", "throughput": 5661.38, "total_tokens": 19280336} {"current_steps": 29555, "total_steps": 33920, "loss": 0.3391, "lr": 4.962405889000588e-07, "epoch": 17.42629716981132, "percentage": 87.13, "elapsed_time": "0:56:46", "remaining_time": "0:08:23", "throughput": 5661.46, "total_tokens": 19283472} {"current_steps": 29560, "total_steps": 33920, "loss": 0.3236, "lr": 4.951237678656396e-07, "epoch": 17.42924528301887, "percentage": 87.15, "elapsed_time": "0:56:46", "remaining_time": "0:08:22", "throughput": 5661.48, "total_tokens": 19287024} {"current_steps": 29565, "total_steps": 33920, "loss": 0.3463, "lr": 4.940081395166174e-07, "epoch": 17.432193396226417, "percentage": 87.16, "elapsed_time": "0:56:47", "remaining_time": "0:08:21", "throughput": 5661.61, "total_tokens": 19290544} {"current_steps": 29570, "total_steps": 33920, "loss": 0.3387, "lr": 4.928937041483606e-07, "epoch": 17.43514150943396, "percentage": 87.18, "elapsed_time": "0:56:47", "remaining_time": "0:08:21", "throughput": 5661.83, "total_tokens": 19295184} {"current_steps": 29575, "total_steps": 33920, "loss": 0.1971, "lr": 4.917804620559202e-07, "epoch": 17.43808962264151, "percentage": 87.19, "elapsed_time": "0:56:48", "remaining_time": "0:08:20", "throughput": 5661.81, "total_tokens": 19298160} {"current_steps": 29580, "total_steps": 33920, "loss": 0.4083, "lr": 4.906684135340317e-07, "epoch": 17.441037735849058, "percentage": 87.21, "elapsed_time": "0:56:48", "remaining_time": "0:08:20", "throughput": 5661.79, "total_tokens": 19300976} {"current_steps": 29585, "total_steps": 33920, "loss": 0.457, "lr": 4.89557558877114e-07, "epoch": 17.443985849056602, "percentage": 87.22, "elapsed_time": "0:56:49", "remaining_time": "0:08:19", "throughput": 5661.83, "total_tokens": 19304048} {"current_steps": 29590, "total_steps": 33920, "loss": 0.2452, "lr": 4.884478983792728e-07, "epoch": 17.44693396226415, "percentage": 87.23, "elapsed_time": "0:56:50", "remaining_time": "0:08:18", "throughput": 5661.92, "total_tokens": 19307248} {"current_steps": 29595, "total_steps": 33920, "loss": 0.2956, "lr": 4.873394323342939e-07, "epoch": 17.4498820754717, "percentage": 87.25, "elapsed_time": "0:56:50", "remaining_time": "0:08:18", "throughput": 5661.93, "total_tokens": 19310608} {"current_steps": 29600, "total_steps": 33920, "loss": 0.2721, "lr": 4.86232161035648e-07, "epoch": 17.452830188679247, "percentage": 87.26, "elapsed_time": "0:56:51", "remaining_time": "0:08:17", "throughput": 5661.94, "total_tokens": 19313584} {"current_steps": 29605, "total_steps": 33920, "loss": 0.301, "lr": 4.851260847764916e-07, "epoch": 17.45577830188679, "percentage": 87.28, "elapsed_time": "0:56:51", "remaining_time": "0:08:17", "throughput": 5662.07, "total_tokens": 19317968} {"current_steps": 29610, "total_steps": 33920, "loss": 0.317, "lr": 4.840212038496622e-07, "epoch": 17.45872641509434, "percentage": 87.29, "elapsed_time": "0:56:52", "remaining_time": "0:08:16", "throughput": 5662.1, "total_tokens": 19321104} {"current_steps": 29615, "total_steps": 33920, "loss": 0.331, "lr": 4.82917518547682e-07, "epoch": 17.461674528301888, "percentage": 87.31, "elapsed_time": "0:56:52", "remaining_time": "0:08:16", "throughput": 5662.21, "total_tokens": 19324656} {"current_steps": 29620, "total_steps": 33920, "loss": 0.3208, "lr": 4.81815029162756e-07, "epoch": 17.464622641509433, "percentage": 87.32, "elapsed_time": "0:56:53", "remaining_time": "0:08:15", "throughput": 5662.23, "total_tokens": 19327920} {"current_steps": 29625, "total_steps": 33920, "loss": 0.291, "lr": 4.807137359867725e-07, "epoch": 17.46757075471698, "percentage": 87.34, "elapsed_time": "0:56:53", "remaining_time": "0:08:14", "throughput": 5662.22, "total_tokens": 19330800} {"current_steps": 29630, "total_steps": 33920, "loss": 0.2731, "lr": 4.79613639311306e-07, "epoch": 17.47051886792453, "percentage": 87.35, "elapsed_time": "0:56:54", "remaining_time": "0:08:14", "throughput": 5662.28, "total_tokens": 19334320} {"current_steps": 29635, "total_steps": 33920, "loss": 0.2686, "lr": 4.785147394276096e-07, "epoch": 17.473466981132077, "percentage": 87.37, "elapsed_time": "0:56:55", "remaining_time": "0:08:13", "throughput": 5662.35, "total_tokens": 19337648} {"current_steps": 29640, "total_steps": 33920, "loss": 0.3165, "lr": 4.774170366266223e-07, "epoch": 17.47641509433962, "percentage": 87.38, "elapsed_time": "0:56:55", "remaining_time": "0:08:13", "throughput": 5662.29, "total_tokens": 19340976} {"current_steps": 29645, "total_steps": 33920, "loss": 0.4306, "lr": 4.763205311989666e-07, "epoch": 17.47936320754717, "percentage": 87.4, "elapsed_time": "0:56:56", "remaining_time": "0:08:12", "throughput": 5662.33, "total_tokens": 19344080} {"current_steps": 29650, "total_steps": 33920, "loss": 0.4194, "lr": 4.752252234349458e-07, "epoch": 17.482311320754718, "percentage": 87.41, "elapsed_time": "0:56:56", "remaining_time": "0:08:12", "throughput": 5662.59, "total_tokens": 19348816} {"current_steps": 29655, "total_steps": 33920, "loss": 0.2636, "lr": 4.7413111362454634e-07, "epoch": 17.485259433962263, "percentage": 87.43, "elapsed_time": "0:56:57", "remaining_time": "0:08:11", "throughput": 5662.64, "total_tokens": 19351824} {"current_steps": 29660, "total_steps": 33920, "loss": 0.311, "lr": 4.7303820205744143e-07, "epoch": 17.48820754716981, "percentage": 87.44, "elapsed_time": "0:56:58", "remaining_time": "0:08:10", "throughput": 5662.85, "total_tokens": 19356368} {"current_steps": 29665, "total_steps": 33920, "loss": 0.3681, "lr": 4.7194648902298303e-07, "epoch": 17.49115566037736, "percentage": 87.46, "elapsed_time": "0:56:58", "remaining_time": "0:08:10", "throughput": 5662.88, "total_tokens": 19359536} {"current_steps": 29670, "total_steps": 33920, "loss": 0.2564, "lr": 4.7085597481020594e-07, "epoch": 17.494103773584907, "percentage": 87.47, "elapsed_time": "0:56:59", "remaining_time": "0:08:09", "throughput": 5662.89, "total_tokens": 19362832} {"current_steps": 29675, "total_steps": 33920, "loss": 0.4519, "lr": 4.697666597078293e-07, "epoch": 17.497051886792452, "percentage": 87.49, "elapsed_time": "0:56:59", "remaining_time": "0:08:09", "throughput": 5662.77, "total_tokens": 19365264} {"current_steps": 29680, "total_steps": 33920, "loss": 0.276, "lr": 4.6867854400425237e-07, "epoch": 17.5, "percentage": 87.5, "elapsed_time": "0:57:00", "remaining_time": "0:08:08", "throughput": 5662.74, "total_tokens": 19368048} {"current_steps": 29685, "total_steps": 33920, "loss": 0.3494, "lr": 4.6759162798756084e-07, "epoch": 17.502948113207548, "percentage": 87.51, "elapsed_time": "0:57:00", "remaining_time": "0:08:08", "throughput": 5662.77, "total_tokens": 19371248} {"current_steps": 29690, "total_steps": 33920, "loss": 0.3489, "lr": 4.6650591194551895e-07, "epoch": 17.505896226415093, "percentage": 87.53, "elapsed_time": "0:57:01", "remaining_time": "0:08:07", "throughput": 5662.72, "total_tokens": 19373904} {"current_steps": 29695, "total_steps": 33920, "loss": 0.2702, "lr": 4.654213961655757e-07, "epoch": 17.50884433962264, "percentage": 87.54, "elapsed_time": "0:57:01", "remaining_time": "0:08:06", "throughput": 5662.76, "total_tokens": 19377168} {"current_steps": 29700, "total_steps": 33920, "loss": 0.2467, "lr": 4.6433808093486075e-07, "epoch": 17.51179245283019, "percentage": 87.56, "elapsed_time": "0:57:02", "remaining_time": "0:08:06", "throughput": 5662.79, "total_tokens": 19380560} {"current_steps": 29705, "total_steps": 33920, "loss": 0.3421, "lr": 4.63255966540187e-07, "epoch": 17.514740566037737, "percentage": 87.57, "elapsed_time": "0:57:02", "remaining_time": "0:08:05", "throughput": 5662.83, "total_tokens": 19383728} {"current_steps": 29710, "total_steps": 33920, "loss": 0.3978, "lr": 4.62175053268048e-07, "epoch": 17.517688679245282, "percentage": 87.59, "elapsed_time": "0:57:03", "remaining_time": "0:08:05", "throughput": 5662.94, "total_tokens": 19387248} {"current_steps": 29715, "total_steps": 33920, "loss": 0.3003, "lr": 4.6109534140462045e-07, "epoch": 17.52063679245283, "percentage": 87.6, "elapsed_time": "0:57:04", "remaining_time": "0:08:04", "throughput": 5662.86, "total_tokens": 19389968} {"current_steps": 29720, "total_steps": 33920, "loss": 0.2801, "lr": 4.6001683123576226e-07, "epoch": 17.52358490566038, "percentage": 87.62, "elapsed_time": "0:57:04", "remaining_time": "0:08:03", "throughput": 5662.91, "total_tokens": 19393232} {"current_steps": 29725, "total_steps": 33920, "loss": 0.2981, "lr": 4.589395230470145e-07, "epoch": 17.526533018867923, "percentage": 87.63, "elapsed_time": "0:57:05", "remaining_time": "0:08:03", "throughput": 5662.86, "total_tokens": 19396016} {"current_steps": 29730, "total_steps": 33920, "loss": 0.272, "lr": 4.578634171235996e-07, "epoch": 17.52948113207547, "percentage": 87.65, "elapsed_time": "0:57:05", "remaining_time": "0:08:02", "throughput": 5662.86, "total_tokens": 19399248} {"current_steps": 29735, "total_steps": 33920, "loss": 0.4159, "lr": 4.567885137504202e-07, "epoch": 17.53242924528302, "percentage": 87.66, "elapsed_time": "0:57:06", "remaining_time": "0:08:02", "throughput": 5662.93, "total_tokens": 19402544} {"current_steps": 29740, "total_steps": 33920, "loss": 0.2357, "lr": 4.55714813212062e-07, "epoch": 17.535377358490567, "percentage": 87.68, "elapsed_time": "0:57:06", "remaining_time": "0:08:01", "throughput": 5662.92, "total_tokens": 19405264} {"current_steps": 29745, "total_steps": 33920, "loss": 0.319, "lr": 4.5464231579279206e-07, "epoch": 17.538325471698112, "percentage": 87.69, "elapsed_time": "0:57:07", "remaining_time": "0:08:01", "throughput": 5663.03, "total_tokens": 19408720} {"current_steps": 29750, "total_steps": 33920, "loss": 0.264, "lr": 4.535710217765571e-07, "epoch": 17.54127358490566, "percentage": 87.71, "elapsed_time": "0:57:07", "remaining_time": "0:08:00", "throughput": 5663.13, "total_tokens": 19412304} {"current_steps": 29755, "total_steps": 33920, "loss": 0.2706, "lr": 4.5250093144698913e-07, "epoch": 17.54422169811321, "percentage": 87.72, "elapsed_time": "0:57:08", "remaining_time": "0:07:59", "throughput": 5663.16, "total_tokens": 19415216} {"current_steps": 29760, "total_steps": 33920, "loss": 0.2453, "lr": 4.514320450873988e-07, "epoch": 17.547169811320753, "percentage": 87.74, "elapsed_time": "0:57:08", "remaining_time": "0:07:59", "throughput": 5663.38, "total_tokens": 19419600} {"current_steps": 29765, "total_steps": 33920, "loss": 0.2474, "lr": 4.503643629807769e-07, "epoch": 17.5501179245283, "percentage": 87.75, "elapsed_time": "0:57:09", "remaining_time": "0:07:58", "throughput": 5663.23, "total_tokens": 19421872} {"current_steps": 29770, "total_steps": 33920, "loss": 0.3223, "lr": 4.4929788540979844e-07, "epoch": 17.55306603773585, "percentage": 87.77, "elapsed_time": "0:57:10", "remaining_time": "0:07:58", "throughput": 5663.24, "total_tokens": 19425136} {"current_steps": 29775, "total_steps": 33920, "loss": 0.3028, "lr": 4.4823261265681596e-07, "epoch": 17.556014150943398, "percentage": 87.78, "elapsed_time": "0:57:10", "remaining_time": "0:07:57", "throughput": 5663.48, "total_tokens": 19430288} {"current_steps": 29780, "total_steps": 33920, "loss": 0.3121, "lr": 4.471685450038671e-07, "epoch": 17.558962264150942, "percentage": 87.79, "elapsed_time": "0:57:11", "remaining_time": "0:07:57", "throughput": 5663.45, "total_tokens": 19433392} {"current_steps": 29785, "total_steps": 33920, "loss": 0.2639, "lr": 4.4610568273266706e-07, "epoch": 17.56191037735849, "percentage": 87.81, "elapsed_time": "0:57:11", "remaining_time": "0:07:56", "throughput": 5663.55, "total_tokens": 19436752} {"current_steps": 29790, "total_steps": 33920, "loss": 0.291, "lr": 4.450440261246142e-07, "epoch": 17.56485849056604, "percentage": 87.82, "elapsed_time": "0:57:12", "remaining_time": "0:07:55", "throughput": 5663.56, "total_tokens": 19440112} {"current_steps": 29795, "total_steps": 33920, "loss": 0.2637, "lr": 4.439835754607863e-07, "epoch": 17.567806603773583, "percentage": 87.84, "elapsed_time": "0:57:13", "remaining_time": "0:07:55", "throughput": 5663.49, "total_tokens": 19443088} {"current_steps": 29800, "total_steps": 33920, "loss": 0.3194, "lr": 4.429243310219422e-07, "epoch": 17.57075471698113, "percentage": 87.85, "elapsed_time": "0:57:13", "remaining_time": "0:07:54", "throughput": 5663.67, "total_tokens": 19447056} {"current_steps": 29805, "total_steps": 33920, "loss": 0.3207, "lr": 4.418662930885215e-07, "epoch": 17.57370283018868, "percentage": 87.87, "elapsed_time": "0:57:14", "remaining_time": "0:07:54", "throughput": 5663.73, "total_tokens": 19450640} {"current_steps": 29810, "total_steps": 33920, "loss": 0.2822, "lr": 4.408094619406439e-07, "epoch": 17.576650943396228, "percentage": 87.88, "elapsed_time": "0:57:14", "remaining_time": "0:07:53", "throughput": 5663.7, "total_tokens": 19453840} {"current_steps": 29815, "total_steps": 33920, "loss": 0.2301, "lr": 4.3975383785810954e-07, "epoch": 17.579599056603772, "percentage": 87.9, "elapsed_time": "0:57:15", "remaining_time": "0:07:52", "throughput": 5663.75, "total_tokens": 19457424} {"current_steps": 29820, "total_steps": 33920, "loss": 0.3121, "lr": 4.3869942112040096e-07, "epoch": 17.58254716981132, "percentage": 87.91, "elapsed_time": "0:57:16", "remaining_time": "0:07:52", "throughput": 5664.03, "total_tokens": 19463376} {"current_steps": 29825, "total_steps": 33920, "loss": 0.3803, "lr": 4.3764621200667936e-07, "epoch": 17.58549528301887, "percentage": 87.93, "elapsed_time": "0:57:16", "remaining_time": "0:07:51", "throughput": 5664.12, "total_tokens": 19466736} {"current_steps": 29830, "total_steps": 33920, "loss": 0.2282, "lr": 4.365942107957849e-07, "epoch": 17.588443396226417, "percentage": 87.94, "elapsed_time": "0:57:17", "remaining_time": "0:07:51", "throughput": 5664.02, "total_tokens": 19469168} {"current_steps": 29835, "total_steps": 33920, "loss": 0.2505, "lr": 4.35543417766241e-07, "epoch": 17.59139150943396, "percentage": 87.96, "elapsed_time": "0:57:17", "remaining_time": "0:07:50", "throughput": 5664.07, "total_tokens": 19472688} {"current_steps": 29840, "total_steps": 33920, "loss": 0.3478, "lr": 4.3449383319624785e-07, "epoch": 17.59433962264151, "percentage": 87.97, "elapsed_time": "0:57:18", "remaining_time": "0:07:50", "throughput": 5664.13, "total_tokens": 19476016} {"current_steps": 29845, "total_steps": 33920, "loss": 0.3952, "lr": 4.3344545736368926e-07, "epoch": 17.597287735849058, "percentage": 87.99, "elapsed_time": "0:57:19", "remaining_time": "0:07:49", "throughput": 5664.17, "total_tokens": 19479248} {"current_steps": 29850, "total_steps": 33920, "loss": 0.3353, "lr": 4.323982905461266e-07, "epoch": 17.600235849056602, "percentage": 88.0, "elapsed_time": "0:57:19", "remaining_time": "0:07:48", "throughput": 5664.29, "total_tokens": 19483152} {"current_steps": 29855, "total_steps": 33920, "loss": 0.3586, "lr": 4.313523330208019e-07, "epoch": 17.60318396226415, "percentage": 88.02, "elapsed_time": "0:57:20", "remaining_time": "0:07:48", "throughput": 5664.42, "total_tokens": 19486864} {"current_steps": 29860, "total_steps": 33920, "loss": 0.2687, "lr": 4.303075850646371e-07, "epoch": 17.6061320754717, "percentage": 88.03, "elapsed_time": "0:57:20", "remaining_time": "0:07:47", "throughput": 5664.42, "total_tokens": 19489680} {"current_steps": 29865, "total_steps": 33920, "loss": 0.3526, "lr": 4.2926404695423305e-07, "epoch": 17.609080188679247, "percentage": 88.05, "elapsed_time": "0:57:21", "remaining_time": "0:07:47", "throughput": 5664.26, "total_tokens": 19492080} {"current_steps": 29870, "total_steps": 33920, "loss": 0.313, "lr": 4.282217189658705e-07, "epoch": 17.61202830188679, "percentage": 88.06, "elapsed_time": "0:57:21", "remaining_time": "0:07:46", "throughput": 5664.3, "total_tokens": 19495184} {"current_steps": 29875, "total_steps": 33920, "loss": 0.354, "lr": 4.27180601375512e-07, "epoch": 17.61497641509434, "percentage": 88.07, "elapsed_time": "0:57:22", "remaining_time": "0:07:46", "throughput": 5664.32, "total_tokens": 19498160} {"current_steps": 29880, "total_steps": 33920, "loss": 0.3712, "lr": 4.2614069445879646e-07, "epoch": 17.617924528301888, "percentage": 88.09, "elapsed_time": "0:57:22", "remaining_time": "0:07:45", "throughput": 5664.48, "total_tokens": 19501968} {"current_steps": 29885, "total_steps": 33920, "loss": 0.4004, "lr": 4.251019984910448e-07, "epoch": 17.620872641509433, "percentage": 88.1, "elapsed_time": "0:57:23", "remaining_time": "0:07:44", "throughput": 5664.51, "total_tokens": 19505072} {"current_steps": 29890, "total_steps": 33920, "loss": 0.3436, "lr": 4.2406451374725597e-07, "epoch": 17.62382075471698, "percentage": 88.12, "elapsed_time": "0:57:23", "remaining_time": "0:07:44", "throughput": 5664.5, "total_tokens": 19508016} {"current_steps": 29895, "total_steps": 33920, "loss": 0.2946, "lr": 4.2302824050210855e-07, "epoch": 17.62676886792453, "percentage": 88.13, "elapsed_time": "0:57:24", "remaining_time": "0:07:43", "throughput": 5664.33, "total_tokens": 19510640} {"current_steps": 29900, "total_steps": 33920, "loss": 0.2977, "lr": 4.2199317902995974e-07, "epoch": 17.629716981132077, "percentage": 88.15, "elapsed_time": "0:57:25", "remaining_time": "0:07:43", "throughput": 5664.5, "total_tokens": 19515120} {"current_steps": 29905, "total_steps": 33920, "loss": 0.2225, "lr": 4.209593296048459e-07, "epoch": 17.63266509433962, "percentage": 88.16, "elapsed_time": "0:57:25", "remaining_time": "0:07:42", "throughput": 5664.32, "total_tokens": 19517616} {"current_steps": 29910, "total_steps": 33920, "loss": 0.3369, "lr": 4.1992669250048524e-07, "epoch": 17.63561320754717, "percentage": 88.18, "elapsed_time": "0:57:26", "remaining_time": "0:07:42", "throughput": 5664.29, "total_tokens": 19520976} {"current_steps": 29915, "total_steps": 33920, "loss": 0.4101, "lr": 4.188952679902719e-07, "epoch": 17.638561320754718, "percentage": 88.19, "elapsed_time": "0:57:26", "remaining_time": "0:07:41", "throughput": 5664.27, "total_tokens": 19523984} {"current_steps": 29920, "total_steps": 33920, "loss": 0.3525, "lr": 4.178650563472797e-07, "epoch": 17.641509433962263, "percentage": 88.21, "elapsed_time": "0:57:27", "remaining_time": "0:07:40", "throughput": 5664.31, "total_tokens": 19527600} {"current_steps": 29925, "total_steps": 33920, "loss": 0.1958, "lr": 4.168360578442615e-07, "epoch": 17.64445754716981, "percentage": 88.22, "elapsed_time": "0:57:28", "remaining_time": "0:07:40", "throughput": 5664.36, "total_tokens": 19531088} {"current_steps": 29930, "total_steps": 33920, "loss": 0.4181, "lr": 4.1580827275365e-07, "epoch": 17.64740566037736, "percentage": 88.24, "elapsed_time": "0:57:28", "remaining_time": "0:07:39", "throughput": 5664.36, "total_tokens": 19534096} {"current_steps": 29935, "total_steps": 33920, "loss": 0.2538, "lr": 4.147817013475536e-07, "epoch": 17.650353773584907, "percentage": 88.25, "elapsed_time": "0:57:29", "remaining_time": "0:07:39", "throughput": 5664.34, "total_tokens": 19537104} {"current_steps": 29940, "total_steps": 33920, "loss": 0.364, "lr": 4.1375634389776375e-07, "epoch": 17.653301886792452, "percentage": 88.27, "elapsed_time": "0:57:29", "remaining_time": "0:07:38", "throughput": 5664.31, "total_tokens": 19539792} {"current_steps": 29945, "total_steps": 33920, "loss": 0.3605, "lr": 4.127322006757478e-07, "epoch": 17.65625, "percentage": 88.28, "elapsed_time": "0:57:30", "remaining_time": "0:07:37", "throughput": 5664.32, "total_tokens": 19542736} {"current_steps": 29950, "total_steps": 33920, "loss": 0.3084, "lr": 4.1170927195265163e-07, "epoch": 17.659198113207548, "percentage": 88.3, "elapsed_time": "0:57:30", "remaining_time": "0:07:37", "throughput": 5664.26, "total_tokens": 19545808} {"current_steps": 29955, "total_steps": 33920, "loss": 0.3281, "lr": 4.1068755799930026e-07, "epoch": 17.662146226415093, "percentage": 88.31, "elapsed_time": "0:57:31", "remaining_time": "0:07:36", "throughput": 5664.18, "total_tokens": 19548560} {"current_steps": 29960, "total_steps": 33920, "loss": 0.2985, "lr": 4.096670590861962e-07, "epoch": 17.66509433962264, "percentage": 88.33, "elapsed_time": "0:57:31", "remaining_time": "0:07:36", "throughput": 5664.09, "total_tokens": 19551152} {"current_steps": 29965, "total_steps": 33920, "loss": 0.2938, "lr": 4.086477754835211e-07, "epoch": 17.66804245283019, "percentage": 88.34, "elapsed_time": "0:57:32", "remaining_time": "0:07:35", "throughput": 5664.08, "total_tokens": 19554096} {"current_steps": 29970, "total_steps": 33920, "loss": 0.2838, "lr": 4.0762970746113517e-07, "epoch": 17.670990566037737, "percentage": 88.35, "elapsed_time": "0:57:32", "remaining_time": "0:07:35", "throughput": 5664.11, "total_tokens": 19557712} {"current_steps": 29975, "total_steps": 33920, "loss": 0.3082, "lr": 4.0661285528857676e-07, "epoch": 17.673938679245282, "percentage": 88.37, "elapsed_time": "0:57:33", "remaining_time": "0:07:34", "throughput": 5664.07, "total_tokens": 19560752} {"current_steps": 29980, "total_steps": 33920, "loss": 0.269, "lr": 4.0559721923506155e-07, "epoch": 17.67688679245283, "percentage": 88.38, "elapsed_time": "0:57:34", "remaining_time": "0:07:33", "throughput": 5664.09, "total_tokens": 19563952} {"current_steps": 29985, "total_steps": 33920, "loss": 0.3325, "lr": 4.045827995694834e-07, "epoch": 17.67983490566038, "percentage": 88.4, "elapsed_time": "0:57:34", "remaining_time": "0:07:33", "throughput": 5664.04, "total_tokens": 19566832} {"current_steps": 29990, "total_steps": 33920, "loss": 0.3582, "lr": 4.035695965604142e-07, "epoch": 17.682783018867923, "percentage": 88.41, "elapsed_time": "0:57:35", "remaining_time": "0:07:32", "throughput": 5664.07, "total_tokens": 19569840} {"current_steps": 29995, "total_steps": 33920, "loss": 0.2413, "lr": 4.0255761047610365e-07, "epoch": 17.68573113207547, "percentage": 88.43, "elapsed_time": "0:57:35", "remaining_time": "0:07:32", "throughput": 5664.1, "total_tokens": 19572944} {"current_steps": 30000, "total_steps": 33920, "loss": 0.3416, "lr": 4.0154684158447864e-07, "epoch": 17.68867924528302, "percentage": 88.44, "elapsed_time": "0:57:36", "remaining_time": "0:07:31", "throughput": 5664.23, "total_tokens": 19576880} {"current_steps": 30005, "total_steps": 33920, "loss": 0.2505, "lr": 4.0053729015314623e-07, "epoch": 17.691627358490567, "percentage": 88.46, "elapsed_time": "0:57:36", "remaining_time": "0:07:31", "throughput": 5664.27, "total_tokens": 19580240} {"current_steps": 30010, "total_steps": 33920, "loss": 0.3053, "lr": 3.9952895644938926e-07, "epoch": 17.694575471698112, "percentage": 88.47, "elapsed_time": "0:57:37", "remaining_time": "0:07:30", "throughput": 5664.28, "total_tokens": 19583280} {"current_steps": 30015, "total_steps": 33920, "loss": 0.3301, "lr": 3.985218407401681e-07, "epoch": 17.69752358490566, "percentage": 88.49, "elapsed_time": "0:57:37", "remaining_time": "0:07:29", "throughput": 5664.32, "total_tokens": 19586736} {"current_steps": 30020, "total_steps": 33920, "loss": 0.2569, "lr": 3.975159432921205e-07, "epoch": 17.70047169811321, "percentage": 88.5, "elapsed_time": "0:57:38", "remaining_time": "0:07:29", "throughput": 5664.47, "total_tokens": 19590544} {"current_steps": 30025, "total_steps": 33920, "loss": 0.2829, "lr": 3.9651126437156294e-07, "epoch": 17.703419811320753, "percentage": 88.52, "elapsed_time": "0:57:39", "remaining_time": "0:07:28", "throughput": 5664.59, "total_tokens": 19594160} {"current_steps": 30030, "total_steps": 33920, "loss": 0.2393, "lr": 3.9550780424448653e-07, "epoch": 17.7063679245283, "percentage": 88.53, "elapsed_time": "0:57:39", "remaining_time": "0:07:28", "throughput": 5664.53, "total_tokens": 19597296} {"current_steps": 30035, "total_steps": 33920, "loss": 0.3034, "lr": 3.9450556317656487e-07, "epoch": 17.70931603773585, "percentage": 88.55, "elapsed_time": "0:57:40", "remaining_time": "0:07:27", "throughput": 5664.69, "total_tokens": 19600976} {"current_steps": 30040, "total_steps": 33920, "loss": 0.3863, "lr": 3.935045414331434e-07, "epoch": 17.712264150943398, "percentage": 88.56, "elapsed_time": "0:57:40", "remaining_time": "0:07:27", "throughput": 5664.77, "total_tokens": 19605008} {"current_steps": 30045, "total_steps": 33920, "loss": 0.3222, "lr": 3.925047392792475e-07, "epoch": 17.715212264150942, "percentage": 88.58, "elapsed_time": "0:57:41", "remaining_time": "0:07:26", "throughput": 5664.94, "total_tokens": 19608944} {"current_steps": 30050, "total_steps": 33920, "loss": 0.2717, "lr": 3.9150615697957917e-07, "epoch": 17.71816037735849, "percentage": 88.59, "elapsed_time": "0:57:41", "remaining_time": "0:07:25", "throughput": 5664.95, "total_tokens": 19612016} {"current_steps": 30055, "total_steps": 33920, "loss": 0.3504, "lr": 3.9050879479851753e-07, "epoch": 17.72110849056604, "percentage": 88.61, "elapsed_time": "0:57:42", "remaining_time": "0:07:25", "throughput": 5665.08, "total_tokens": 19615632} {"current_steps": 30060, "total_steps": 33920, "loss": 0.3382, "lr": 3.89512653000117e-07, "epoch": 17.724056603773583, "percentage": 88.62, "elapsed_time": "0:57:43", "remaining_time": "0:07:24", "throughput": 5665.0, "total_tokens": 19618160} {"current_steps": 30065, "total_steps": 33920, "loss": 0.3233, "lr": 3.8851773184811203e-07, "epoch": 17.72700471698113, "percentage": 88.64, "elapsed_time": "0:57:43", "remaining_time": "0:07:24", "throughput": 5664.91, "total_tokens": 19620784} {"current_steps": 30070, "total_steps": 33920, "loss": 0.2703, "lr": 3.8752403160591255e-07, "epoch": 17.72995283018868, "percentage": 88.65, "elapsed_time": "0:57:44", "remaining_time": "0:07:23", "throughput": 5664.83, "total_tokens": 19623408} {"current_steps": 30075, "total_steps": 33920, "loss": 0.3463, "lr": 3.8653155253660477e-07, "epoch": 17.732900943396228, "percentage": 88.66, "elapsed_time": "0:57:44", "remaining_time": "0:07:22", "throughput": 5664.86, "total_tokens": 19626832} {"current_steps": 30080, "total_steps": 33920, "loss": 0.2681, "lr": 3.8554029490295073e-07, "epoch": 17.735849056603772, "percentage": 88.68, "elapsed_time": "0:57:45", "remaining_time": "0:07:22", "throughput": 5664.96, "total_tokens": 19630224} {"current_steps": 30085, "total_steps": 33920, "loss": 0.2114, "lr": 3.8455025896739164e-07, "epoch": 17.73879716981132, "percentage": 88.69, "elapsed_time": "0:57:45", "remaining_time": "0:07:21", "throughput": 5664.84, "total_tokens": 19632656} {"current_steps": 30090, "total_steps": 33920, "loss": 0.3769, "lr": 3.8356144499204215e-07, "epoch": 17.74174528301887, "percentage": 88.71, "elapsed_time": "0:57:46", "remaining_time": "0:07:21", "throughput": 5664.94, "total_tokens": 19636400} {"current_steps": 30095, "total_steps": 33920, "loss": 0.3341, "lr": 3.8257385323869576e-07, "epoch": 17.744693396226417, "percentage": 88.72, "elapsed_time": "0:57:46", "remaining_time": "0:07:20", "throughput": 5664.95, "total_tokens": 19639440} {"current_steps": 30100, "total_steps": 33920, "loss": 0.2892, "lr": 3.815874839688222e-07, "epoch": 17.74764150943396, "percentage": 88.74, "elapsed_time": "0:57:47", "remaining_time": "0:07:20", "throughput": 5665.1, "total_tokens": 19643536} {"current_steps": 30105, "total_steps": 33920, "loss": 0.2481, "lr": 3.8060233744356634e-07, "epoch": 17.75058962264151, "percentage": 88.75, "elapsed_time": "0:57:47", "remaining_time": "0:07:19", "throughput": 5665.06, "total_tokens": 19646224} {"current_steps": 30110, "total_steps": 33920, "loss": 0.2878, "lr": 3.796184139237502e-07, "epoch": 17.753537735849058, "percentage": 88.77, "elapsed_time": "0:57:48", "remaining_time": "0:07:18", "throughput": 5664.98, "total_tokens": 19648848} {"current_steps": 30115, "total_steps": 33920, "loss": 0.2424, "lr": 3.7863571366987206e-07, "epoch": 17.756485849056602, "percentage": 88.78, "elapsed_time": "0:57:49", "remaining_time": "0:07:18", "throughput": 5665.09, "total_tokens": 19652560} {"current_steps": 30120, "total_steps": 33920, "loss": 0.2921, "lr": 3.776542369421049e-07, "epoch": 17.75943396226415, "percentage": 88.8, "elapsed_time": "0:57:49", "remaining_time": "0:07:17", "throughput": 5665.05, "total_tokens": 19655440} {"current_steps": 30125, "total_steps": 33920, "loss": 0.2471, "lr": 3.766739840003003e-07, "epoch": 17.7623820754717, "percentage": 88.81, "elapsed_time": "0:57:50", "remaining_time": "0:07:17", "throughput": 5664.92, "total_tokens": 19657936} {"current_steps": 30130, "total_steps": 33920, "loss": 0.3031, "lr": 3.756949551039835e-07, "epoch": 17.765330188679247, "percentage": 88.83, "elapsed_time": "0:57:50", "remaining_time": "0:07:16", "throughput": 5665.08, "total_tokens": 19662544} {"current_steps": 30135, "total_steps": 33920, "loss": 0.2436, "lr": 3.7471715051235757e-07, "epoch": 17.76827830188679, "percentage": 88.84, "elapsed_time": "0:57:51", "remaining_time": "0:07:16", "throughput": 5665.23, "total_tokens": 19666416} {"current_steps": 30140, "total_steps": 33920, "loss": 0.3651, "lr": 3.7374057048429947e-07, "epoch": 17.77122641509434, "percentage": 88.86, "elapsed_time": "0:57:51", "remaining_time": "0:07:15", "throughput": 5665.12, "total_tokens": 19669040} {"current_steps": 30145, "total_steps": 33920, "loss": 0.4039, "lr": 3.7276521527836396e-07, "epoch": 17.774174528301888, "percentage": 88.87, "elapsed_time": "0:57:52", "remaining_time": "0:07:14", "throughput": 5665.35, "total_tokens": 19673648} {"current_steps": 30150, "total_steps": 33920, "loss": 0.2903, "lr": 3.717910851527784e-07, "epoch": 17.777122641509433, "percentage": 88.89, "elapsed_time": "0:57:53", "remaining_time": "0:07:14", "throughput": 5665.36, "total_tokens": 19676528} {"current_steps": 30155, "total_steps": 33920, "loss": 0.244, "lr": 3.708181803654498e-07, "epoch": 17.78007075471698, "percentage": 88.9, "elapsed_time": "0:57:53", "remaining_time": "0:07:13", "throughput": 5665.4, "total_tokens": 19679696} {"current_steps": 30160, "total_steps": 33920, "loss": 0.2425, "lr": 3.6984650117395993e-07, "epoch": 17.78301886792453, "percentage": 88.92, "elapsed_time": "0:57:54", "remaining_time": "0:07:13", "throughput": 5665.28, "total_tokens": 19682512} {"current_steps": 30165, "total_steps": 33920, "loss": 0.2804, "lr": 3.688760478355635e-07, "epoch": 17.785966981132077, "percentage": 88.93, "elapsed_time": "0:57:54", "remaining_time": "0:07:12", "throughput": 5665.25, "total_tokens": 19685552} {"current_steps": 30170, "total_steps": 33920, "loss": 0.3399, "lr": 3.679068206071923e-07, "epoch": 17.78891509433962, "percentage": 88.94, "elapsed_time": "0:57:55", "remaining_time": "0:07:11", "throughput": 5665.13, "total_tokens": 19688048} {"current_steps": 30175, "total_steps": 33920, "loss": 0.2963, "lr": 3.669388197454532e-07, "epoch": 17.79186320754717, "percentage": 88.96, "elapsed_time": "0:57:55", "remaining_time": "0:07:11", "throughput": 5665.12, "total_tokens": 19690960} {"current_steps": 30180, "total_steps": 33920, "loss": 0.2896, "lr": 3.6597204550662956e-07, "epoch": 17.794811320754718, "percentage": 88.97, "elapsed_time": "0:57:56", "remaining_time": "0:07:10", "throughput": 5665.13, "total_tokens": 19693936} {"current_steps": 30185, "total_steps": 33920, "loss": 0.29, "lr": 3.650064981466772e-07, "epoch": 17.797759433962263, "percentage": 88.99, "elapsed_time": "0:57:56", "remaining_time": "0:07:10", "throughput": 5665.14, "total_tokens": 19697072} {"current_steps": 30190, "total_steps": 33920, "loss": 0.2891, "lr": 3.640421779212311e-07, "epoch": 17.80070754716981, "percentage": 89.0, "elapsed_time": "0:57:57", "remaining_time": "0:07:09", "throughput": 5665.06, "total_tokens": 19699696} {"current_steps": 30195, "total_steps": 33920, "loss": 0.323, "lr": 3.630790850855986e-07, "epoch": 17.80365566037736, "percentage": 89.02, "elapsed_time": "0:57:57", "remaining_time": "0:07:09", "throughput": 5665.02, "total_tokens": 19702928} {"current_steps": 30200, "total_steps": 33920, "loss": 0.2993, "lr": 3.62117219894762e-07, "epoch": 17.806603773584907, "percentage": 89.03, "elapsed_time": "0:57:58", "remaining_time": "0:07:08", "throughput": 5665.06, "total_tokens": 19706064} {"current_steps": 30205, "total_steps": 33920, "loss": 0.4681, "lr": 3.611565826033797e-07, "epoch": 17.809551886792452, "percentage": 89.05, "elapsed_time": "0:57:59", "remaining_time": "0:07:07", "throughput": 5665.13, "total_tokens": 19709520} {"current_steps": 30210, "total_steps": 33920, "loss": 0.3719, "lr": 3.6019717346578445e-07, "epoch": 17.8125, "percentage": 89.06, "elapsed_time": "0:58:00", "remaining_time": "0:07:07", "throughput": 5665.22, "total_tokens": 19716112} {"current_steps": 30215, "total_steps": 33920, "loss": 0.3702, "lr": 3.5923899273598293e-07, "epoch": 17.815448113207548, "percentage": 89.08, "elapsed_time": "0:58:00", "remaining_time": "0:07:06", "throughput": 5665.22, "total_tokens": 19719056} {"current_steps": 30220, "total_steps": 33920, "loss": 0.2669, "lr": 3.582820406676596e-07, "epoch": 17.818396226415093, "percentage": 89.09, "elapsed_time": "0:58:01", "remaining_time": "0:07:06", "throughput": 5665.12, "total_tokens": 19721456} {"current_steps": 30225, "total_steps": 33920, "loss": 0.3417, "lr": 3.5732631751417056e-07, "epoch": 17.82134433962264, "percentage": 89.11, "elapsed_time": "0:58:01", "remaining_time": "0:07:05", "throughput": 5665.13, "total_tokens": 19724432} {"current_steps": 30230, "total_steps": 33920, "loss": 0.356, "lr": 3.563718235285485e-07, "epoch": 17.82429245283019, "percentage": 89.12, "elapsed_time": "0:58:02", "remaining_time": "0:07:05", "throughput": 5665.24, "total_tokens": 19728496} {"current_steps": 30235, "total_steps": 33920, "loss": 0.2916, "lr": 3.5541855896349844e-07, "epoch": 17.827240566037737, "percentage": 89.14, "elapsed_time": "0:58:02", "remaining_time": "0:07:04", "throughput": 5665.18, "total_tokens": 19731120} {"current_steps": 30240, "total_steps": 33920, "loss": 0.2883, "lr": 3.544665240714018e-07, "epoch": 17.830188679245282, "percentage": 89.15, "elapsed_time": "0:58:03", "remaining_time": "0:07:03", "throughput": 5665.21, "total_tokens": 19734192} {"current_steps": 30245, "total_steps": 33920, "loss": 0.4068, "lr": 3.535157191043137e-07, "epoch": 17.83313679245283, "percentage": 89.17, "elapsed_time": "0:58:03", "remaining_time": "0:07:03", "throughput": 5665.23, "total_tokens": 19737104} {"current_steps": 30250, "total_steps": 33920, "loss": 0.3138, "lr": 3.5256614431396385e-07, "epoch": 17.83608490566038, "percentage": 89.18, "elapsed_time": "0:58:04", "remaining_time": "0:07:02", "throughput": 5665.23, "total_tokens": 19742480} {"current_steps": 30255, "total_steps": 33920, "loss": 0.2504, "lr": 3.516177999517578e-07, "epoch": 17.839033018867923, "percentage": 89.2, "elapsed_time": "0:58:05", "remaining_time": "0:07:02", "throughput": 5665.19, "total_tokens": 19745040} {"current_steps": 30260, "total_steps": 33920, "loss": 0.2715, "lr": 3.50670686268772e-07, "epoch": 17.84198113207547, "percentage": 89.21, "elapsed_time": "0:58:05", "remaining_time": "0:07:01", "throughput": 5665.15, "total_tokens": 19747664} {"current_steps": 30265, "total_steps": 33920, "loss": 0.3268, "lr": 3.497248035157602e-07, "epoch": 17.84492924528302, "percentage": 89.22, "elapsed_time": "0:58:06", "remaining_time": "0:07:01", "throughput": 5665.26, "total_tokens": 19751184} {"current_steps": 30270, "total_steps": 33920, "loss": 0.4222, "lr": 3.4878015194314773e-07, "epoch": 17.847877358490567, "percentage": 89.24, "elapsed_time": "0:58:06", "remaining_time": "0:07:00", "throughput": 5665.36, "total_tokens": 19754800} {"current_steps": 30275, "total_steps": 33920, "loss": 0.3148, "lr": 3.4783673180103617e-07, "epoch": 17.850825471698112, "percentage": 89.25, "elapsed_time": "0:58:07", "remaining_time": "0:06:59", "throughput": 5665.41, "total_tokens": 19757904} {"current_steps": 30280, "total_steps": 33920, "loss": 0.5146, "lr": 3.468945433391985e-07, "epoch": 17.85377358490566, "percentage": 89.27, "elapsed_time": "0:58:08", "remaining_time": "0:06:59", "throughput": 5665.29, "total_tokens": 19761392} {"current_steps": 30285, "total_steps": 33920, "loss": 0.2667, "lr": 3.459535868070851e-07, "epoch": 17.85672169811321, "percentage": 89.28, "elapsed_time": "0:58:08", "remaining_time": "0:06:58", "throughput": 5665.14, "total_tokens": 19763568} {"current_steps": 30290, "total_steps": 33920, "loss": 0.3641, "lr": 3.450138624538174e-07, "epoch": 17.859669811320753, "percentage": 89.3, "elapsed_time": "0:58:09", "remaining_time": "0:06:58", "throughput": 5665.14, "total_tokens": 19766704} {"current_steps": 30295, "total_steps": 33920, "loss": 0.2482, "lr": 3.440753705281913e-07, "epoch": 17.8626179245283, "percentage": 89.31, "elapsed_time": "0:58:09", "remaining_time": "0:06:57", "throughput": 5665.16, "total_tokens": 19769904} {"current_steps": 30300, "total_steps": 33920, "loss": 0.3732, "lr": 3.4313811127867693e-07, "epoch": 17.86556603773585, "percentage": 89.33, "elapsed_time": "0:58:10", "remaining_time": "0:06:56", "throughput": 5665.12, "total_tokens": 19772720} {"current_steps": 30305, "total_steps": 33920, "loss": 0.3046, "lr": 3.4220208495341745e-07, "epoch": 17.868514150943398, "percentage": 89.34, "elapsed_time": "0:58:10", "remaining_time": "0:06:56", "throughput": 5665.21, "total_tokens": 19776144} {"current_steps": 30310, "total_steps": 33920, "loss": 0.4016, "lr": 3.412672918002291e-07, "epoch": 17.871462264150942, "percentage": 89.36, "elapsed_time": "0:58:11", "remaining_time": "0:06:55", "throughput": 5665.33, "total_tokens": 19779824} {"current_steps": 30315, "total_steps": 33920, "loss": 0.236, "lr": 3.403337320666045e-07, "epoch": 17.87441037735849, "percentage": 89.37, "elapsed_time": "0:58:11", "remaining_time": "0:06:55", "throughput": 5665.32, "total_tokens": 19782832} {"current_steps": 30320, "total_steps": 33920, "loss": 0.2286, "lr": 3.394014059997064e-07, "epoch": 17.87735849056604, "percentage": 89.39, "elapsed_time": "0:58:12", "remaining_time": "0:06:54", "throughput": 5665.4, "total_tokens": 19786192} {"current_steps": 30325, "total_steps": 33920, "loss": 0.3561, "lr": 3.3847031384637185e-07, "epoch": 17.880306603773583, "percentage": 89.4, "elapsed_time": "0:58:13", "remaining_time": "0:06:54", "throughput": 5665.6, "total_tokens": 19790736} {"current_steps": 30330, "total_steps": 33920, "loss": 0.3541, "lr": 3.3754045585311147e-07, "epoch": 17.88325471698113, "percentage": 89.42, "elapsed_time": "0:58:13", "remaining_time": "0:06:53", "throughput": 5665.56, "total_tokens": 19793584} {"current_steps": 30335, "total_steps": 33920, "loss": 0.2574, "lr": 3.366118322661094e-07, "epoch": 17.88620283018868, "percentage": 89.43, "elapsed_time": "0:58:14", "remaining_time": "0:06:52", "throughput": 5665.81, "total_tokens": 19798832} {"current_steps": 30340, "total_steps": 33920, "loss": 0.3633, "lr": 3.3568444333122283e-07, "epoch": 17.889150943396228, "percentage": 89.45, "elapsed_time": "0:58:14", "remaining_time": "0:06:52", "throughput": 5665.85, "total_tokens": 19801936} {"current_steps": 30345, "total_steps": 33920, "loss": 0.3435, "lr": 3.347582892939816e-07, "epoch": 17.892099056603772, "percentage": 89.46, "elapsed_time": "0:58:15", "remaining_time": "0:06:51", "throughput": 5665.95, "total_tokens": 19805648} {"current_steps": 30350, "total_steps": 33920, "loss": 0.4421, "lr": 3.338333703995905e-07, "epoch": 17.89504716981132, "percentage": 89.48, "elapsed_time": "0:58:16", "remaining_time": "0:06:51", "throughput": 5665.89, "total_tokens": 19808240} {"current_steps": 30355, "total_steps": 33920, "loss": 0.3599, "lr": 3.329096868929238e-07, "epoch": 17.89799528301887, "percentage": 89.49, "elapsed_time": "0:58:16", "remaining_time": "0:06:50", "throughput": 5665.88, "total_tokens": 19811184} {"current_steps": 30360, "total_steps": 33920, "loss": 0.2981, "lr": 3.319872390185325e-07, "epoch": 17.900943396226417, "percentage": 89.5, "elapsed_time": "0:58:17", "remaining_time": "0:06:50", "throughput": 5665.89, "total_tokens": 19814064} {"current_steps": 30365, "total_steps": 33920, "loss": 0.3339, "lr": 3.3106602702063727e-07, "epoch": 17.90389150943396, "percentage": 89.52, "elapsed_time": "0:58:17", "remaining_time": "0:06:49", "throughput": 5665.81, "total_tokens": 19816976} {"current_steps": 30370, "total_steps": 33920, "loss": 0.2165, "lr": 3.3014605114313316e-07, "epoch": 17.90683962264151, "percentage": 89.53, "elapsed_time": "0:58:18", "remaining_time": "0:06:48", "throughput": 5665.89, "total_tokens": 19820240} {"current_steps": 30375, "total_steps": 33920, "loss": 0.2161, "lr": 3.2922731162958744e-07, "epoch": 17.909787735849058, "percentage": 89.55, "elapsed_time": "0:58:18", "remaining_time": "0:06:48", "throughput": 5665.79, "total_tokens": 19822608} {"current_steps": 30380, "total_steps": 33920, "loss": 0.289, "lr": 3.2830980872324114e-07, "epoch": 17.912735849056602, "percentage": 89.56, "elapsed_time": "0:58:19", "remaining_time": "0:06:47", "throughput": 5665.83, "total_tokens": 19825744} {"current_steps": 30385, "total_steps": 33920, "loss": 0.1966, "lr": 3.2739354266700775e-07, "epoch": 17.91568396226415, "percentage": 89.58, "elapsed_time": "0:58:19", "remaining_time": "0:06:47", "throughput": 5665.93, "total_tokens": 19829264} {"current_steps": 30390, "total_steps": 33920, "loss": 0.2513, "lr": 3.264785137034709e-07, "epoch": 17.9186320754717, "percentage": 89.59, "elapsed_time": "0:58:20", "remaining_time": "0:06:46", "throughput": 5665.8, "total_tokens": 19831728} {"current_steps": 30395, "total_steps": 33920, "loss": 0.2735, "lr": 3.2556472207488977e-07, "epoch": 17.921580188679247, "percentage": 89.61, "elapsed_time": "0:58:20", "remaining_time": "0:06:46", "throughput": 5665.99, "total_tokens": 19835664} {"current_steps": 30400, "total_steps": 33920, "loss": 0.3221, "lr": 3.246521680231934e-07, "epoch": 17.92452830188679, "percentage": 89.62, "elapsed_time": "0:58:21", "remaining_time": "0:06:45", "throughput": 5666.04, "total_tokens": 19838672} {"current_steps": 30405, "total_steps": 33920, "loss": 0.3461, "lr": 3.2374085178998594e-07, "epoch": 17.92747641509434, "percentage": 89.64, "elapsed_time": "0:58:21", "remaining_time": "0:06:44", "throughput": 5666.14, "total_tokens": 19841808} {"current_steps": 30410, "total_steps": 33920, "loss": 0.272, "lr": 3.2283077361654145e-07, "epoch": 17.930424528301888, "percentage": 89.65, "elapsed_time": "0:58:22", "remaining_time": "0:06:44", "throughput": 5666.14, "total_tokens": 19844528} {"current_steps": 30415, "total_steps": 33920, "loss": 0.2614, "lr": 3.2192193374380677e-07, "epoch": 17.933372641509433, "percentage": 89.67, "elapsed_time": "0:58:23", "remaining_time": "0:06:43", "throughput": 5666.3, "total_tokens": 19849360} {"current_steps": 30420, "total_steps": 33920, "loss": 0.2683, "lr": 3.210143324124021e-07, "epoch": 17.93632075471698, "percentage": 89.68, "elapsed_time": "0:58:24", "remaining_time": "0:06:43", "throughput": 5666.63, "total_tokens": 19856400} {"current_steps": 30425, "total_steps": 33920, "loss": 0.4036, "lr": 3.2010796986261805e-07, "epoch": 17.93926886792453, "percentage": 89.7, "elapsed_time": "0:58:24", "remaining_time": "0:06:42", "throughput": 5666.84, "total_tokens": 19860848} {"current_steps": 30430, "total_steps": 33920, "loss": 0.2543, "lr": 3.1920284633441713e-07, "epoch": 17.942216981132077, "percentage": 89.71, "elapsed_time": "0:58:25", "remaining_time": "0:06:42", "throughput": 5666.83, "total_tokens": 19863600} {"current_steps": 30435, "total_steps": 33920, "loss": 0.2435, "lr": 3.1829896206743704e-07, "epoch": 17.94516509433962, "percentage": 89.73, "elapsed_time": "0:58:25", "remaining_time": "0:06:41", "throughput": 5666.85, "total_tokens": 19866320} {"current_steps": 30440, "total_steps": 33920, "loss": 0.2821, "lr": 3.173963173009825e-07, "epoch": 17.94811320754717, "percentage": 89.74, "elapsed_time": "0:58:26", "remaining_time": "0:06:40", "throughput": 5666.86, "total_tokens": 19869040} {"current_steps": 30445, "total_steps": 33920, "loss": 0.3873, "lr": 3.164949122740352e-07, "epoch": 17.951061320754718, "percentage": 89.76, "elapsed_time": "0:58:26", "remaining_time": "0:06:40", "throughput": 5666.87, "total_tokens": 19871920} {"current_steps": 30450, "total_steps": 33920, "loss": 0.3104, "lr": 3.1559474722524406e-07, "epoch": 17.954009433962263, "percentage": 89.77, "elapsed_time": "0:58:27", "remaining_time": "0:06:39", "throughput": 5666.86, "total_tokens": 19874704} {"current_steps": 30455, "total_steps": 33920, "loss": 0.2786, "lr": 3.146958223929325e-07, "epoch": 17.95695754716981, "percentage": 89.78, "elapsed_time": "0:58:27", "remaining_time": "0:06:39", "throughput": 5666.86, "total_tokens": 19877520} {"current_steps": 30460, "total_steps": 33920, "loss": 0.452, "lr": 3.1379813801509454e-07, "epoch": 17.95990566037736, "percentage": 89.8, "elapsed_time": "0:58:28", "remaining_time": "0:06:38", "throughput": 5667.07, "total_tokens": 19881840} {"current_steps": 30465, "total_steps": 33920, "loss": 0.2294, "lr": 3.1290169432939556e-07, "epoch": 17.962853773584907, "percentage": 89.81, "elapsed_time": "0:58:28", "remaining_time": "0:06:37", "throughput": 5667.2, "total_tokens": 19885712} {"current_steps": 30470, "total_steps": 33920, "loss": 0.3337, "lr": 3.120064915731735e-07, "epoch": 17.965801886792452, "percentage": 89.83, "elapsed_time": "0:58:29", "remaining_time": "0:06:37", "throughput": 5667.33, "total_tokens": 19889328} {"current_steps": 30475, "total_steps": 33920, "loss": 0.2596, "lr": 3.1111252998343723e-07, "epoch": 17.96875, "percentage": 89.84, "elapsed_time": "0:58:30", "remaining_time": "0:06:36", "throughput": 5667.4, "total_tokens": 19892944} {"current_steps": 30480, "total_steps": 33920, "loss": 0.3538, "lr": 3.102198097968662e-07, "epoch": 17.971698113207548, "percentage": 89.86, "elapsed_time": "0:58:30", "remaining_time": "0:06:36", "throughput": 5667.41, "total_tokens": 19896144} {"current_steps": 30485, "total_steps": 33920, "loss": 0.2861, "lr": 3.093283312498124e-07, "epoch": 17.974646226415093, "percentage": 89.87, "elapsed_time": "0:58:31", "remaining_time": "0:06:35", "throughput": 5667.46, "total_tokens": 19899056} {"current_steps": 30490, "total_steps": 33920, "loss": 0.3174, "lr": 3.084380945782989e-07, "epoch": 17.97759433962264, "percentage": 89.89, "elapsed_time": "0:58:31", "remaining_time": "0:06:35", "throughput": 5667.51, "total_tokens": 19902064} {"current_steps": 30495, "total_steps": 33920, "loss": 0.2133, "lr": 3.0754910001801866e-07, "epoch": 17.98054245283019, "percentage": 89.9, "elapsed_time": "0:58:32", "remaining_time": "0:06:34", "throughput": 5667.65, "total_tokens": 19905616} {"current_steps": 30500, "total_steps": 33920, "loss": 0.2998, "lr": 3.0666134780433786e-07, "epoch": 17.983490566037737, "percentage": 89.92, "elapsed_time": "0:58:32", "remaining_time": "0:06:33", "throughput": 5667.63, "total_tokens": 19908336} {"current_steps": 30505, "total_steps": 33920, "loss": 0.3673, "lr": 3.0577483817229306e-07, "epoch": 17.986438679245282, "percentage": 89.93, "elapsed_time": "0:58:33", "remaining_time": "0:06:33", "throughput": 5667.62, "total_tokens": 19911152} {"current_steps": 30510, "total_steps": 33920, "loss": 0.3242, "lr": 3.0488957135659023e-07, "epoch": 17.98938679245283, "percentage": 89.95, "elapsed_time": "0:58:33", "remaining_time": "0:06:32", "throughput": 5667.73, "total_tokens": 19914640} {"current_steps": 30515, "total_steps": 33920, "loss": 0.2564, "lr": 3.040055475916087e-07, "epoch": 17.99233490566038, "percentage": 89.96, "elapsed_time": "0:58:34", "remaining_time": "0:06:32", "throughput": 5667.8, "total_tokens": 19917936} {"current_steps": 30520, "total_steps": 33920, "loss": 0.328, "lr": 3.0312276711139675e-07, "epoch": 17.995283018867923, "percentage": 89.98, "elapsed_time": "0:58:34", "remaining_time": "0:06:31", "throughput": 5667.94, "total_tokens": 19921776} {"current_steps": 30525, "total_steps": 33920, "loss": 0.3527, "lr": 3.0224123014967353e-07, "epoch": 17.99823113207547, "percentage": 89.99, "elapsed_time": "0:58:35", "remaining_time": "0:06:30", "throughput": 5667.97, "total_tokens": 19924848} {"current_steps": 30528, "total_steps": 33920, "eval_loss": 0.6273570656776428, "epoch": 18.0, "percentage": 90.0, "elapsed_time": "0:58:55", "remaining_time": "0:06:32", "throughput": 5636.66, "total_tokens": 19926608} {"current_steps": 30530, "total_steps": 33920, "loss": 0.2776, "lr": 3.013609369398324e-07, "epoch": 18.00117924528302, "percentage": 90.01, "elapsed_time": "0:58:58", "remaining_time": "0:06:32", "throughput": 5631.09, "total_tokens": 19927888} {"current_steps": 30535, "total_steps": 33920, "loss": 0.2073, "lr": 3.004818877149318e-07, "epoch": 18.004127358490567, "percentage": 90.02, "elapsed_time": "0:58:59", "remaining_time": "0:06:32", "throughput": 5630.99, "total_tokens": 19930608} {"current_steps": 30540, "total_steps": 33920, "loss": 0.3069, "lr": 2.9960408270770624e-07, "epoch": 18.007075471698112, "percentage": 90.04, "elapsed_time": "0:59:00", "remaining_time": "0:06:31", "throughput": 5630.96, "total_tokens": 19933872} {"current_steps": 30545, "total_steps": 33920, "loss": 0.3925, "lr": 2.9872752215055755e-07, "epoch": 18.01002358490566, "percentage": 90.05, "elapsed_time": "0:59:00", "remaining_time": "0:06:31", "throughput": 5630.99, "total_tokens": 19936944} {"current_steps": 30550, "total_steps": 33920, "loss": 0.3283, "lr": 2.9785220627555844e-07, "epoch": 18.01297169811321, "percentage": 90.06, "elapsed_time": "0:59:01", "remaining_time": "0:06:30", "throughput": 5630.92, "total_tokens": 19939536} {"current_steps": 30555, "total_steps": 33920, "loss": 0.3485, "lr": 2.9697813531445295e-07, "epoch": 18.015919811320753, "percentage": 90.08, "elapsed_time": "0:59:01", "remaining_time": "0:06:30", "throughput": 5630.72, "total_tokens": 19942512} {"current_steps": 30560, "total_steps": 33920, "loss": 0.2613, "lr": 2.9610530949865433e-07, "epoch": 18.0188679245283, "percentage": 90.09, "elapsed_time": "0:59:02", "remaining_time": "0:06:29", "throughput": 5630.7, "total_tokens": 19945840} {"current_steps": 30565, "total_steps": 33920, "loss": 0.3541, "lr": 2.952337290592483e-07, "epoch": 18.02181603773585, "percentage": 90.11, "elapsed_time": "0:59:02", "remaining_time": "0:06:28", "throughput": 5630.56, "total_tokens": 19948688} {"current_steps": 30570, "total_steps": 33920, "loss": 0.2613, "lr": 2.9436339422698913e-07, "epoch": 18.024764150943398, "percentage": 90.12, "elapsed_time": "0:59:03", "remaining_time": "0:06:28", "throughput": 5630.71, "total_tokens": 19952464} {"current_steps": 30575, "total_steps": 33920, "loss": 0.359, "lr": 2.934943052323008e-07, "epoch": 18.027712264150942, "percentage": 90.14, "elapsed_time": "0:59:04", "remaining_time": "0:06:27", "throughput": 5630.81, "total_tokens": 19956112} {"current_steps": 30580, "total_steps": 33920, "loss": 0.2984, "lr": 2.926264623052799e-07, "epoch": 18.03066037735849, "percentage": 90.15, "elapsed_time": "0:59:04", "remaining_time": "0:06:27", "throughput": 5630.9, "total_tokens": 19959472} {"current_steps": 30585, "total_steps": 33920, "loss": 0.2322, "lr": 2.9175986567569036e-07, "epoch": 18.03360849056604, "percentage": 90.17, "elapsed_time": "0:59:05", "remaining_time": "0:06:26", "throughput": 5630.75, "total_tokens": 19962224} {"current_steps": 30590, "total_steps": 33920, "loss": 0.259, "lr": 2.9089451557296755e-07, "epoch": 18.036556603773583, "percentage": 90.18, "elapsed_time": "0:59:05", "remaining_time": "0:06:25", "throughput": 5630.67, "total_tokens": 19965008} {"current_steps": 30595, "total_steps": 33920, "loss": 0.4284, "lr": 2.9003041222621706e-07, "epoch": 18.03950471698113, "percentage": 90.2, "elapsed_time": "0:59:06", "remaining_time": "0:06:25", "throughput": 5630.77, "total_tokens": 19968624} {"current_steps": 30600, "total_steps": 33920, "loss": 0.3152, "lr": 2.8916755586421375e-07, "epoch": 18.04245283018868, "percentage": 90.21, "elapsed_time": "0:59:06", "remaining_time": "0:06:24", "throughput": 5630.76, "total_tokens": 19971728} {"current_steps": 30605, "total_steps": 33920, "loss": 0.2578, "lr": 2.883059467154031e-07, "epoch": 18.045400943396228, "percentage": 90.23, "elapsed_time": "0:59:07", "remaining_time": "0:06:24", "throughput": 5630.8, "total_tokens": 19974768} {"current_steps": 30610, "total_steps": 33920, "loss": 0.3173, "lr": 2.8744558500789887e-07, "epoch": 18.048349056603772, "percentage": 90.24, "elapsed_time": "0:59:07", "remaining_time": "0:06:23", "throughput": 5630.89, "total_tokens": 19978384} {"current_steps": 30615, "total_steps": 33920, "loss": 0.4031, "lr": 2.8658647096948546e-07, "epoch": 18.05129716981132, "percentage": 90.26, "elapsed_time": "0:59:08", "remaining_time": "0:06:23", "throughput": 5630.95, "total_tokens": 19981872} {"current_steps": 30620, "total_steps": 33920, "loss": 0.2739, "lr": 2.8572860482761813e-07, "epoch": 18.05424528301887, "percentage": 90.27, "elapsed_time": "0:59:09", "remaining_time": "0:06:22", "throughput": 5630.93, "total_tokens": 19985232} {"current_steps": 30625, "total_steps": 33920, "loss": 0.5049, "lr": 2.8487198680942017e-07, "epoch": 18.057193396226417, "percentage": 90.29, "elapsed_time": "0:59:09", "remaining_time": "0:06:21", "throughput": 5630.81, "total_tokens": 19987824} {"current_steps": 30630, "total_steps": 33920, "loss": 0.2201, "lr": 2.840166171416836e-07, "epoch": 18.06014150943396, "percentage": 90.3, "elapsed_time": "0:59:10", "remaining_time": "0:06:21", "throughput": 5630.88, "total_tokens": 19991184} {"current_steps": 30635, "total_steps": 33920, "loss": 0.2935, "lr": 2.8316249605087386e-07, "epoch": 18.06308962264151, "percentage": 90.32, "elapsed_time": "0:59:10", "remaining_time": "0:06:20", "throughput": 5631.02, "total_tokens": 19994672} {"current_steps": 30640, "total_steps": 33920, "loss": 0.2354, "lr": 2.823096237631212e-07, "epoch": 18.066037735849058, "percentage": 90.33, "elapsed_time": "0:59:11", "remaining_time": "0:06:20", "throughput": 5631.04, "total_tokens": 19997744} {"current_steps": 30645, "total_steps": 33920, "loss": 0.2568, "lr": 2.814580005042283e-07, "epoch": 18.068985849056602, "percentage": 90.34, "elapsed_time": "0:59:11", "remaining_time": "0:06:19", "throughput": 5631.17, "total_tokens": 20001904} {"current_steps": 30650, "total_steps": 33920, "loss": 0.2637, "lr": 2.8060762649966435e-07, "epoch": 18.07193396226415, "percentage": 90.36, "elapsed_time": "0:59:12", "remaining_time": "0:06:19", "throughput": 5631.08, "total_tokens": 20004624} {"current_steps": 30655, "total_steps": 33920, "loss": 0.3086, "lr": 2.797585019745713e-07, "epoch": 18.0748820754717, "percentage": 90.37, "elapsed_time": "0:59:13", "remaining_time": "0:06:18", "throughput": 5631.09, "total_tokens": 20007824} {"current_steps": 30660, "total_steps": 33920, "loss": 0.2621, "lr": 2.789106271537584e-07, "epoch": 18.077830188679247, "percentage": 90.39, "elapsed_time": "0:59:13", "remaining_time": "0:06:17", "throughput": 5631.05, "total_tokens": 20010896} {"current_steps": 30665, "total_steps": 33920, "loss": 0.1847, "lr": 2.780640022617037e-07, "epoch": 18.08077830188679, "percentage": 90.4, "elapsed_time": "0:59:14", "remaining_time": "0:06:17", "throughput": 5631.15, "total_tokens": 20014160} {"current_steps": 30670, "total_steps": 33920, "loss": 0.2586, "lr": 2.772186275225547e-07, "epoch": 18.08372641509434, "percentage": 90.42, "elapsed_time": "0:59:14", "remaining_time": "0:06:16", "throughput": 5631.3, "total_tokens": 20017968} {"current_steps": 30675, "total_steps": 33920, "loss": 0.2762, "lr": 2.7637450316012836e-07, "epoch": 18.086674528301888, "percentage": 90.43, "elapsed_time": "0:59:15", "remaining_time": "0:06:16", "throughput": 5631.26, "total_tokens": 20020752} {"current_steps": 30680, "total_steps": 33920, "loss": 0.2624, "lr": 2.755316293979088e-07, "epoch": 18.089622641509433, "percentage": 90.45, "elapsed_time": "0:59:15", "remaining_time": "0:06:15", "throughput": 5631.33, "total_tokens": 20024688} {"current_steps": 30685, "total_steps": 33920, "loss": 0.3607, "lr": 2.7469000645905295e-07, "epoch": 18.09257075471698, "percentage": 90.46, "elapsed_time": "0:59:16", "remaining_time": "0:06:14", "throughput": 5631.38, "total_tokens": 20028016} {"current_steps": 30690, "total_steps": 33920, "loss": 0.3788, "lr": 2.738496345663827e-07, "epoch": 18.09551886792453, "percentage": 90.48, "elapsed_time": "0:59:17", "remaining_time": "0:06:14", "throughput": 5631.43, "total_tokens": 20031248} {"current_steps": 30695, "total_steps": 33920, "loss": 0.2775, "lr": 2.7301051394239e-07, "epoch": 18.098466981132077, "percentage": 90.49, "elapsed_time": "0:59:17", "remaining_time": "0:06:13", "throughput": 5631.33, "total_tokens": 20034128} {"current_steps": 30700, "total_steps": 33920, "loss": 0.1811, "lr": 2.72172644809236e-07, "epoch": 18.10141509433962, "percentage": 90.51, "elapsed_time": "0:59:18", "remaining_time": "0:06:13", "throughput": 5631.43, "total_tokens": 20038032} {"current_steps": 30705, "total_steps": 33920, "loss": 0.3259, "lr": 2.7133602738875e-07, "epoch": 18.10436320754717, "percentage": 90.52, "elapsed_time": "0:59:18", "remaining_time": "0:06:12", "throughput": 5631.43, "total_tokens": 20040880} {"current_steps": 30710, "total_steps": 33920, "loss": 0.3329, "lr": 2.7050066190242976e-07, "epoch": 18.107311320754718, "percentage": 90.54, "elapsed_time": "0:59:19", "remaining_time": "0:06:12", "throughput": 5631.59, "total_tokens": 20044720} {"current_steps": 30715, "total_steps": 33920, "loss": 0.2293, "lr": 2.696665485714428e-07, "epoch": 18.110259433962263, "percentage": 90.55, "elapsed_time": "0:59:19", "remaining_time": "0:06:11", "throughput": 5631.68, "total_tokens": 20047888} {"current_steps": 30720, "total_steps": 33920, "loss": 0.2933, "lr": 2.6883368761662367e-07, "epoch": 18.11320754716981, "percentage": 90.57, "elapsed_time": "0:59:20", "remaining_time": "0:06:10", "throughput": 5631.73, "total_tokens": 20050896} {"current_steps": 30725, "total_steps": 33920, "loss": 0.321, "lr": 2.680020792584759e-07, "epoch": 18.11615566037736, "percentage": 90.58, "elapsed_time": "0:59:20", "remaining_time": "0:06:10", "throughput": 5631.62, "total_tokens": 20053648} {"current_steps": 30730, "total_steps": 33920, "loss": 0.2552, "lr": 2.6717172371717113e-07, "epoch": 18.119103773584907, "percentage": 90.6, "elapsed_time": "0:59:21", "remaining_time": "0:06:09", "throughput": 5631.58, "total_tokens": 20056368} {"current_steps": 30735, "total_steps": 33920, "loss": 0.3099, "lr": 2.663426212125503e-07, "epoch": 18.122051886792452, "percentage": 90.61, "elapsed_time": "0:59:21", "remaining_time": "0:06:09", "throughput": 5631.4, "total_tokens": 20058672} {"current_steps": 30740, "total_steps": 33920, "loss": 0.4385, "lr": 2.655147719641216e-07, "epoch": 18.125, "percentage": 90.62, "elapsed_time": "0:59:22", "remaining_time": "0:06:08", "throughput": 5631.45, "total_tokens": 20061936} {"current_steps": 30745, "total_steps": 33920, "loss": 0.2967, "lr": 2.646881761910602e-07, "epoch": 18.127948113207548, "percentage": 90.64, "elapsed_time": "0:59:23", "remaining_time": "0:06:07", "throughput": 5631.37, "total_tokens": 20064560} {"current_steps": 30750, "total_steps": 33920, "loss": 0.3224, "lr": 2.638628341122135e-07, "epoch": 18.130896226415093, "percentage": 90.65, "elapsed_time": "0:59:23", "remaining_time": "0:06:07", "throughput": 5631.46, "total_tokens": 20068112} {"current_steps": 30755, "total_steps": 33920, "loss": 0.2529, "lr": 2.6303874594609314e-07, "epoch": 18.13384433962264, "percentage": 90.67, "elapsed_time": "0:59:24", "remaining_time": "0:06:06", "throughput": 5631.44, "total_tokens": 20070960} {"current_steps": 30760, "total_steps": 33920, "loss": 0.2808, "lr": 2.622159119108797e-07, "epoch": 18.13679245283019, "percentage": 90.68, "elapsed_time": "0:59:24", "remaining_time": "0:06:06", "throughput": 5631.48, "total_tokens": 20074224} {"current_steps": 30765, "total_steps": 33920, "loss": 0.2716, "lr": 2.6139433222442226e-07, "epoch": 18.139740566037737, "percentage": 90.7, "elapsed_time": "0:59:25", "remaining_time": "0:06:05", "throughput": 5631.54, "total_tokens": 20077648} {"current_steps": 30770, "total_steps": 33920, "loss": 0.181, "lr": 2.6057400710423787e-07, "epoch": 18.142688679245282, "percentage": 90.71, "elapsed_time": "0:59:25", "remaining_time": "0:06:05", "throughput": 5631.59, "total_tokens": 20081104} {"current_steps": 30775, "total_steps": 33920, "loss": 0.3386, "lr": 2.5975493676751004e-07, "epoch": 18.14563679245283, "percentage": 90.73, "elapsed_time": "0:59:26", "remaining_time": "0:06:04", "throughput": 5631.49, "total_tokens": 20083728} {"current_steps": 30780, "total_steps": 33920, "loss": 0.3307, "lr": 2.589371214310926e-07, "epoch": 18.14858490566038, "percentage": 90.74, "elapsed_time": "0:59:26", "remaining_time": "0:06:03", "throughput": 5631.47, "total_tokens": 20086832} {"current_steps": 30785, "total_steps": 33920, "loss": 0.2589, "lr": 2.581205613115051e-07, "epoch": 18.151533018867923, "percentage": 90.76, "elapsed_time": "0:59:27", "remaining_time": "0:06:03", "throughput": 5631.67, "total_tokens": 20090992} {"current_steps": 30790, "total_steps": 33920, "loss": 0.3204, "lr": 2.573052566249357e-07, "epoch": 18.15448113207547, "percentage": 90.77, "elapsed_time": "0:59:28", "remaining_time": "0:06:02", "throughput": 5631.62, "total_tokens": 20093776} {"current_steps": 30795, "total_steps": 33920, "loss": 0.3867, "lr": 2.5649120758723945e-07, "epoch": 18.15742924528302, "percentage": 90.79, "elapsed_time": "0:59:28", "remaining_time": "0:06:02", "throughput": 5631.75, "total_tokens": 20097232} {"current_steps": 30800, "total_steps": 33920, "loss": 0.2212, "lr": 2.5567841441393906e-07, "epoch": 18.160377358490567, "percentage": 90.8, "elapsed_time": "0:59:29", "remaining_time": "0:06:01", "throughput": 5631.91, "total_tokens": 20101328} {"current_steps": 30805, "total_steps": 33920, "loss": 0.2554, "lr": 2.548668773202245e-07, "epoch": 18.163325471698112, "percentage": 90.82, "elapsed_time": "0:59:29", "remaining_time": "0:06:00", "throughput": 5631.87, "total_tokens": 20103952} {"current_steps": 30810, "total_steps": 33920, "loss": 0.365, "lr": 2.5405659652095573e-07, "epoch": 18.16627358490566, "percentage": 90.83, "elapsed_time": "0:59:30", "remaining_time": "0:06:00", "throughput": 5631.88, "total_tokens": 20106736} {"current_steps": 30815, "total_steps": 33920, "loss": 0.2938, "lr": 2.5324757223065655e-07, "epoch": 18.16922169811321, "percentage": 90.85, "elapsed_time": "0:59:30", "remaining_time": "0:05:59", "throughput": 5631.9, "total_tokens": 20109808} {"current_steps": 30820, "total_steps": 33920, "loss": 0.5024, "lr": 2.524398046635207e-07, "epoch": 18.172169811320753, "percentage": 90.86, "elapsed_time": "0:59:31", "remaining_time": "0:05:59", "throughput": 5632.01, "total_tokens": 20113648} {"current_steps": 30825, "total_steps": 33920, "loss": 0.2344, "lr": 2.51633294033406e-07, "epoch": 18.1751179245283, "percentage": 90.88, "elapsed_time": "0:59:31", "remaining_time": "0:05:58", "throughput": 5632.13, "total_tokens": 20117328} {"current_steps": 30830, "total_steps": 33920, "loss": 0.27, "lr": 2.5082804055384214e-07, "epoch": 18.17806603773585, "percentage": 90.89, "elapsed_time": "0:59:32", "remaining_time": "0:05:58", "throughput": 5632.1, "total_tokens": 20120368} {"current_steps": 30835, "total_steps": 33920, "loss": 0.3116, "lr": 2.50024044438022e-07, "epoch": 18.181014150943398, "percentage": 90.91, "elapsed_time": "0:59:32", "remaining_time": "0:05:57", "throughput": 5632.03, "total_tokens": 20122928} {"current_steps": 30840, "total_steps": 33920, "loss": 0.2658, "lr": 2.492213058988069e-07, "epoch": 18.183962264150942, "percentage": 90.92, "elapsed_time": "0:59:33", "remaining_time": "0:05:56", "throughput": 5632.08, "total_tokens": 20126384} {"current_steps": 30845, "total_steps": 33920, "loss": 0.1827, "lr": 2.4841982514872633e-07, "epoch": 18.18691037735849, "percentage": 90.93, "elapsed_time": "0:59:34", "remaining_time": "0:05:56", "throughput": 5632.13, "total_tokens": 20129488} {"current_steps": 30850, "total_steps": 33920, "loss": 0.3116, "lr": 2.4761960239997497e-07, "epoch": 18.18985849056604, "percentage": 90.95, "elapsed_time": "0:59:34", "remaining_time": "0:05:55", "throughput": 5632.07, "total_tokens": 20132176} {"current_steps": 30855, "total_steps": 33920, "loss": 0.3685, "lr": 2.4682063786441556e-07, "epoch": 18.192806603773583, "percentage": 90.96, "elapsed_time": "0:59:35", "remaining_time": "0:05:55", "throughput": 5632.14, "total_tokens": 20135696} {"current_steps": 30860, "total_steps": 33920, "loss": 0.3455, "lr": 2.460229317535778e-07, "epoch": 18.19575471698113, "percentage": 90.98, "elapsed_time": "0:59:35", "remaining_time": "0:05:54", "throughput": 5632.15, "total_tokens": 20138576} {"current_steps": 30865, "total_steps": 33920, "loss": 0.3234, "lr": 2.4522648427865725e-07, "epoch": 18.19870283018868, "percentage": 90.99, "elapsed_time": "0:59:36", "remaining_time": "0:05:53", "throughput": 5632.29, "total_tokens": 20142256} {"current_steps": 30870, "total_steps": 33920, "loss": 0.285, "lr": 2.444312956505163e-07, "epoch": 18.201650943396228, "percentage": 91.01, "elapsed_time": "0:59:36", "remaining_time": "0:05:53", "throughput": 5632.32, "total_tokens": 20145808} {"current_steps": 30875, "total_steps": 33920, "loss": 0.4278, "lr": 2.4363736607968537e-07, "epoch": 18.204599056603772, "percentage": 91.02, "elapsed_time": "0:59:37", "remaining_time": "0:05:52", "throughput": 5632.25, "total_tokens": 20148432} {"current_steps": 30880, "total_steps": 33920, "loss": 0.2909, "lr": 2.428446957763608e-07, "epoch": 18.20754716981132, "percentage": 91.04, "elapsed_time": "0:59:37", "remaining_time": "0:05:52", "throughput": 5632.12, "total_tokens": 20150800} {"current_steps": 30885, "total_steps": 33920, "loss": 0.2139, "lr": 2.4205328495040535e-07, "epoch": 18.21049528301887, "percentage": 91.05, "elapsed_time": "0:59:38", "remaining_time": "0:05:51", "throughput": 5632.34, "total_tokens": 20155728} {"current_steps": 30890, "total_steps": 33920, "loss": 0.3497, "lr": 2.412631338113486e-07, "epoch": 18.213443396226417, "percentage": 91.07, "elapsed_time": "0:59:39", "remaining_time": "0:05:51", "throughput": 5632.34, "total_tokens": 20158608} {"current_steps": 30895, "total_steps": 33920, "loss": 0.4422, "lr": 2.404742425683848e-07, "epoch": 18.21639150943396, "percentage": 91.08, "elapsed_time": "0:59:39", "remaining_time": "0:05:50", "throughput": 5632.41, "total_tokens": 20161904} {"current_steps": 30900, "total_steps": 33920, "loss": 0.4067, "lr": 2.3968661143037864e-07, "epoch": 18.21933962264151, "percentage": 91.1, "elapsed_time": "0:59:40", "remaining_time": "0:05:49", "throughput": 5632.52, "total_tokens": 20165296} {"current_steps": 30905, "total_steps": 33920, "loss": 0.4141, "lr": 2.3890024060585823e-07, "epoch": 18.222287735849058, "percentage": 91.11, "elapsed_time": "0:59:40", "remaining_time": "0:05:49", "throughput": 5632.54, "total_tokens": 20168400} {"current_steps": 30910, "total_steps": 33920, "loss": 0.349, "lr": 2.3811513030301826e-07, "epoch": 18.225235849056602, "percentage": 91.13, "elapsed_time": "0:59:41", "remaining_time": "0:05:48", "throughput": 5632.55, "total_tokens": 20172080} {"current_steps": 30915, "total_steps": 33920, "loss": 0.2551, "lr": 2.373312807297201e-07, "epoch": 18.22818396226415, "percentage": 91.14, "elapsed_time": "0:59:41", "remaining_time": "0:05:48", "throughput": 5632.57, "total_tokens": 20175088} {"current_steps": 30920, "total_steps": 33920, "loss": 0.2623, "lr": 2.3654869209349007e-07, "epoch": 18.2311320754717, "percentage": 91.16, "elapsed_time": "0:59:42", "remaining_time": "0:05:47", "throughput": 5632.56, "total_tokens": 20178096} {"current_steps": 30925, "total_steps": 33920, "loss": 0.253, "lr": 2.357673646015246e-07, "epoch": 18.234080188679247, "percentage": 91.17, "elapsed_time": "0:59:42", "remaining_time": "0:05:46", "throughput": 5632.54, "total_tokens": 20180848} {"current_steps": 30930, "total_steps": 33920, "loss": 0.2387, "lr": 2.3498729846068103e-07, "epoch": 18.23702830188679, "percentage": 91.19, "elapsed_time": "0:59:43", "remaining_time": "0:05:46", "throughput": 5632.51, "total_tokens": 20183536} {"current_steps": 30935, "total_steps": 33920, "loss": 0.5658, "lr": 2.342084938774869e-07, "epoch": 18.23997641509434, "percentage": 91.2, "elapsed_time": "0:59:43", "remaining_time": "0:05:45", "throughput": 5632.43, "total_tokens": 20186000} {"current_steps": 30940, "total_steps": 33920, "loss": 0.3096, "lr": 2.334309510581334e-07, "epoch": 18.242924528301888, "percentage": 91.21, "elapsed_time": "0:59:44", "remaining_time": "0:05:45", "throughput": 5632.3, "total_tokens": 20188240} {"current_steps": 30945, "total_steps": 33920, "loss": 0.3215, "lr": 2.3265467020847864e-07, "epoch": 18.245872641509433, "percentage": 91.23, "elapsed_time": "0:59:44", "remaining_time": "0:05:44", "throughput": 5632.11, "total_tokens": 20190512} {"current_steps": 30950, "total_steps": 33920, "loss": 0.3134, "lr": 2.31879651534046e-07, "epoch": 18.24882075471698, "percentage": 91.24, "elapsed_time": "0:59:45", "remaining_time": "0:05:44", "throughput": 5632.01, "total_tokens": 20193040} {"current_steps": 30955, "total_steps": 33920, "loss": 0.4113, "lr": 2.311058952400247e-07, "epoch": 18.25176886792453, "percentage": 91.26, "elapsed_time": "0:59:46", "remaining_time": "0:05:43", "throughput": 5631.92, "total_tokens": 20196432} {"current_steps": 30960, "total_steps": 33920, "loss": 0.3499, "lr": 2.3033340153127026e-07, "epoch": 18.254716981132077, "percentage": 91.27, "elapsed_time": "0:59:46", "remaining_time": "0:05:42", "throughput": 5631.8, "total_tokens": 20198800} {"current_steps": 30965, "total_steps": 33920, "loss": 0.4237, "lr": 2.295621706123041e-07, "epoch": 18.25766509433962, "percentage": 91.29, "elapsed_time": "0:59:47", "remaining_time": "0:05:42", "throughput": 5631.86, "total_tokens": 20202384} {"current_steps": 30970, "total_steps": 33920, "loss": 0.3298, "lr": 2.287922026873135e-07, "epoch": 18.26061320754717, "percentage": 91.3, "elapsed_time": "0:59:47", "remaining_time": "0:05:41", "throughput": 5632.01, "total_tokens": 20206832} {"current_steps": 30975, "total_steps": 33920, "loss": 0.2324, "lr": 2.2802349796014923e-07, "epoch": 18.263561320754718, "percentage": 91.32, "elapsed_time": "0:59:48", "remaining_time": "0:05:41", "throughput": 5632.03, "total_tokens": 20209904} {"current_steps": 30980, "total_steps": 33920, "loss": 0.1808, "lr": 2.2725605663433013e-07, "epoch": 18.266509433962263, "percentage": 91.33, "elapsed_time": "0:59:48", "remaining_time": "0:05:40", "throughput": 5632.14, "total_tokens": 20213712} {"current_steps": 30985, "total_steps": 33920, "loss": 0.2718, "lr": 2.264898789130393e-07, "epoch": 18.26945754716981, "percentage": 91.35, "elapsed_time": "0:59:49", "remaining_time": "0:05:40", "throughput": 5632.22, "total_tokens": 20216976} {"current_steps": 30990, "total_steps": 33920, "loss": 0.3002, "lr": 2.2572496499912554e-07, "epoch": 18.27240566037736, "percentage": 91.36, "elapsed_time": "0:59:50", "remaining_time": "0:05:39", "throughput": 5632.13, "total_tokens": 20219408} {"current_steps": 30995, "total_steps": 33920, "loss": 0.3919, "lr": 2.2496131509510354e-07, "epoch": 18.275353773584907, "percentage": 91.38, "elapsed_time": "0:59:51", "remaining_time": "0:05:38", "throughput": 5632.4, "total_tokens": 20226672} {"current_steps": 31000, "total_steps": 33920, "loss": 0.2783, "lr": 2.2419892940315268e-07, "epoch": 18.278301886792452, "percentage": 91.39, "elapsed_time": "0:59:51", "remaining_time": "0:05:38", "throughput": 5632.52, "total_tokens": 20230448} {"current_steps": 31005, "total_steps": 33920, "loss": 0.3248, "lr": 2.2343780812511819e-07, "epoch": 18.28125, "percentage": 91.41, "elapsed_time": "0:59:52", "remaining_time": "0:05:37", "throughput": 5632.57, "total_tokens": 20233936} {"current_steps": 31010, "total_steps": 33920, "loss": 0.3385, "lr": 2.2267795146250936e-07, "epoch": 18.284198113207548, "percentage": 91.42, "elapsed_time": "0:59:52", "remaining_time": "0:05:37", "throughput": 5632.58, "total_tokens": 20237232} {"current_steps": 31015, "total_steps": 33920, "loss": 0.3543, "lr": 2.2191935961650146e-07, "epoch": 18.287146226415093, "percentage": 91.44, "elapsed_time": "0:59:53", "remaining_time": "0:05:36", "throughput": 5632.55, "total_tokens": 20240112} {"current_steps": 31020, "total_steps": 33920, "loss": 0.4193, "lr": 2.2116203278793603e-07, "epoch": 18.29009433962264, "percentage": 91.45, "elapsed_time": "0:59:54", "remaining_time": "0:05:35", "throughput": 5632.65, "total_tokens": 20243856} {"current_steps": 31025, "total_steps": 33920, "loss": 0.3104, "lr": 2.2040597117731766e-07, "epoch": 18.29304245283019, "percentage": 91.47, "elapsed_time": "0:59:54", "remaining_time": "0:05:35", "throughput": 5632.61, "total_tokens": 20246704} {"current_steps": 31030, "total_steps": 33920, "loss": 0.1606, "lr": 2.1965117498481793e-07, "epoch": 18.295990566037737, "percentage": 91.48, "elapsed_time": "0:59:55", "remaining_time": "0:05:34", "throughput": 5632.87, "total_tokens": 20252592} {"current_steps": 31035, "total_steps": 33920, "loss": 0.3302, "lr": 2.188976444102714e-07, "epoch": 18.298938679245282, "percentage": 91.49, "elapsed_time": "0:59:56", "remaining_time": "0:05:34", "throughput": 5633.06, "total_tokens": 20256976} {"current_steps": 31040, "total_steps": 33920, "loss": 0.3509, "lr": 2.181453796531796e-07, "epoch": 18.30188679245283, "percentage": 91.51, "elapsed_time": "0:59:56", "remaining_time": "0:05:33", "throughput": 5633.13, "total_tokens": 20260464} {"current_steps": 31045, "total_steps": 33920, "loss": 0.2147, "lr": 2.1739438091270658e-07, "epoch": 18.30483490566038, "percentage": 91.52, "elapsed_time": "0:59:57", "remaining_time": "0:05:33", "throughput": 5633.02, "total_tokens": 20262864} {"current_steps": 31050, "total_steps": 33920, "loss": 0.2624, "lr": 2.1664464838768329e-07, "epoch": 18.307783018867923, "percentage": 91.54, "elapsed_time": "0:59:57", "remaining_time": "0:05:32", "throughput": 5632.99, "total_tokens": 20265744} {"current_steps": 31055, "total_steps": 33920, "loss": 0.2706, "lr": 2.1589618227660426e-07, "epoch": 18.31073113207547, "percentage": 91.55, "elapsed_time": "0:59:58", "remaining_time": "0:05:31", "throughput": 5632.84, "total_tokens": 20268272} {"current_steps": 31060, "total_steps": 33920, "loss": 0.3173, "lr": 2.151489827776293e-07, "epoch": 18.31367924528302, "percentage": 91.57, "elapsed_time": "0:59:58", "remaining_time": "0:05:31", "throughput": 5632.86, "total_tokens": 20271088} {"current_steps": 31065, "total_steps": 33920, "loss": 0.3216, "lr": 2.1440305008858298e-07, "epoch": 18.316627358490567, "percentage": 91.58, "elapsed_time": "0:59:59", "remaining_time": "0:05:30", "throughput": 5632.79, "total_tokens": 20273680} {"current_steps": 31070, "total_steps": 33920, "loss": 0.2761, "lr": 2.1365838440695397e-07, "epoch": 18.319575471698112, "percentage": 91.6, "elapsed_time": "0:59:59", "remaining_time": "0:05:30", "throughput": 5632.86, "total_tokens": 20277232} {"current_steps": 31075, "total_steps": 33920, "loss": 0.4049, "lr": 2.129149859298957e-07, "epoch": 18.32252358490566, "percentage": 91.61, "elapsed_time": "1:00:00", "remaining_time": "0:05:29", "throughput": 5632.97, "total_tokens": 20280816} {"current_steps": 31080, "total_steps": 33920, "loss": 0.2688, "lr": 2.1217285485422622e-07, "epoch": 18.32547169811321, "percentage": 91.63, "elapsed_time": "1:00:00", "remaining_time": "0:05:29", "throughput": 5632.95, "total_tokens": 20283920} {"current_steps": 31085, "total_steps": 33920, "loss": 0.3839, "lr": 2.114319913764268e-07, "epoch": 18.328419811320753, "percentage": 91.64, "elapsed_time": "1:00:01", "remaining_time": "0:05:28", "throughput": 5633.0, "total_tokens": 20287472} {"current_steps": 31090, "total_steps": 33920, "loss": 0.2511, "lr": 2.10692395692646e-07, "epoch": 18.3313679245283, "percentage": 91.66, "elapsed_time": "1:00:02", "remaining_time": "0:05:27", "throughput": 5633.0, "total_tokens": 20290448} {"current_steps": 31095, "total_steps": 33920, "loss": 0.2557, "lr": 2.0995406799869444e-07, "epoch": 18.33431603773585, "percentage": 91.67, "elapsed_time": "1:00:02", "remaining_time": "0:05:27", "throughput": 5633.16, "total_tokens": 20294448} {"current_steps": 31100, "total_steps": 33920, "loss": 0.307, "lr": 2.0921700849004743e-07, "epoch": 18.337264150943398, "percentage": 91.69, "elapsed_time": "1:00:03", "remaining_time": "0:05:26", "throughput": 5633.28, "total_tokens": 20298256} {"current_steps": 31105, "total_steps": 33920, "loss": 0.2463, "lr": 2.084812173618439e-07, "epoch": 18.340212264150942, "percentage": 91.7, "elapsed_time": "1:00:03", "remaining_time": "0:05:26", "throughput": 5633.31, "total_tokens": 20301456} {"current_steps": 31110, "total_steps": 33920, "loss": 0.2524, "lr": 2.0774669480888853e-07, "epoch": 18.34316037735849, "percentage": 91.72, "elapsed_time": "1:00:04", "remaining_time": "0:05:25", "throughput": 5633.28, "total_tokens": 20304144} {"current_steps": 31115, "total_steps": 33920, "loss": 0.2215, "lr": 2.0701344102564912e-07, "epoch": 18.34610849056604, "percentage": 91.73, "elapsed_time": "1:00:04", "remaining_time": "0:05:24", "throughput": 5633.14, "total_tokens": 20306480} {"current_steps": 31120, "total_steps": 33920, "loss": 0.2812, "lr": 2.062814562062576e-07, "epoch": 18.349056603773583, "percentage": 91.75, "elapsed_time": "1:00:05", "remaining_time": "0:05:24", "throughput": 5633.09, "total_tokens": 20309072} {"current_steps": 31125, "total_steps": 33920, "loss": 0.4939, "lr": 2.0555074054451063e-07, "epoch": 18.35200471698113, "percentage": 91.76, "elapsed_time": "1:00:05", "remaining_time": "0:05:23", "throughput": 5633.07, "total_tokens": 20311856} {"current_steps": 31130, "total_steps": 33920, "loss": 0.3563, "lr": 2.0482129423386843e-07, "epoch": 18.35495283018868, "percentage": 91.77, "elapsed_time": "1:00:06", "remaining_time": "0:05:23", "throughput": 5633.18, "total_tokens": 20315600} {"current_steps": 31135, "total_steps": 33920, "loss": 0.2881, "lr": 2.040931174674543e-07, "epoch": 18.357900943396228, "percentage": 91.79, "elapsed_time": "1:00:06", "remaining_time": "0:05:22", "throughput": 5633.12, "total_tokens": 20318480} {"current_steps": 31140, "total_steps": 33920, "loss": 0.1799, "lr": 2.0336621043805682e-07, "epoch": 18.360849056603772, "percentage": 91.8, "elapsed_time": "1:00:07", "remaining_time": "0:05:22", "throughput": 5632.95, "total_tokens": 20321008} {"current_steps": 31145, "total_steps": 33920, "loss": 0.2926, "lr": 2.0264057333812704e-07, "epoch": 18.36379716981132, "percentage": 91.82, "elapsed_time": "1:00:08", "remaining_time": "0:05:21", "throughput": 5632.83, "total_tokens": 20323728} {"current_steps": 31150, "total_steps": 33920, "loss": 0.2844, "lr": 2.0191620635978127e-07, "epoch": 18.36674528301887, "percentage": 91.83, "elapsed_time": "1:00:08", "remaining_time": "0:05:20", "throughput": 5632.92, "total_tokens": 20327504} {"current_steps": 31155, "total_steps": 33920, "loss": 0.3416, "lr": 2.0119310969479833e-07, "epoch": 18.369693396226417, "percentage": 91.85, "elapsed_time": "1:00:09", "remaining_time": "0:05:20", "throughput": 5632.98, "total_tokens": 20331088} {"current_steps": 31160, "total_steps": 33920, "loss": 0.2262, "lr": 2.004712835346212e-07, "epoch": 18.37264150943396, "percentage": 91.86, "elapsed_time": "1:00:09", "remaining_time": "0:05:19", "throughput": 5633.01, "total_tokens": 20334352} {"current_steps": 31165, "total_steps": 33920, "loss": 0.2664, "lr": 1.99750728070357e-07, "epoch": 18.37558962264151, "percentage": 91.88, "elapsed_time": "1:00:10", "remaining_time": "0:05:19", "throughput": 5633.0, "total_tokens": 20337456} {"current_steps": 31170, "total_steps": 33920, "loss": 0.3164, "lr": 1.9903144349277536e-07, "epoch": 18.378537735849058, "percentage": 91.89, "elapsed_time": "1:00:10", "remaining_time": "0:05:18", "throughput": 5633.12, "total_tokens": 20341072} {"current_steps": 31175, "total_steps": 33920, "loss": 0.2525, "lr": 1.983134299923095e-07, "epoch": 18.381485849056602, "percentage": 91.91, "elapsed_time": "1:00:11", "remaining_time": "0:05:17", "throughput": 5633.05, "total_tokens": 20343632} {"current_steps": 31180, "total_steps": 33920, "loss": 0.3141, "lr": 1.9759668775905737e-07, "epoch": 18.38443396226415, "percentage": 91.92, "elapsed_time": "1:00:12", "remaining_time": "0:05:17", "throughput": 5633.14, "total_tokens": 20346928} {"current_steps": 31185, "total_steps": 33920, "loss": 0.2668, "lr": 1.9688121698277995e-07, "epoch": 18.3873820754717, "percentage": 91.94, "elapsed_time": "1:00:12", "remaining_time": "0:05:16", "throughput": 5633.2, "total_tokens": 20350032} {"current_steps": 31190, "total_steps": 33920, "loss": 0.2537, "lr": 1.9616701785290015e-07, "epoch": 18.390330188679247, "percentage": 91.95, "elapsed_time": "1:00:13", "remaining_time": "0:05:16", "throughput": 5633.21, "total_tokens": 20353200} {"current_steps": 31195, "total_steps": 33920, "loss": 0.4038, "lr": 1.954540905585056e-07, "epoch": 18.39327830188679, "percentage": 91.97, "elapsed_time": "1:00:13", "remaining_time": "0:05:15", "throughput": 5633.2, "total_tokens": 20356080} {"current_steps": 31200, "total_steps": 33920, "loss": 0.2868, "lr": 1.9474243528834757e-07, "epoch": 18.39622641509434, "percentage": 91.98, "elapsed_time": "1:00:14", "remaining_time": "0:05:15", "throughput": 5633.21, "total_tokens": 20359280} {"current_steps": 31205, "total_steps": 33920, "loss": 0.2359, "lr": 1.9403205223083866e-07, "epoch": 18.399174528301888, "percentage": 92.0, "elapsed_time": "1:00:14", "remaining_time": "0:05:14", "throughput": 5633.17, "total_tokens": 20362448} {"current_steps": 31210, "total_steps": 33920, "loss": 0.3469, "lr": 1.9332294157405619e-07, "epoch": 18.402122641509433, "percentage": 92.01, "elapsed_time": "1:00:15", "remaining_time": "0:05:13", "throughput": 5633.14, "total_tokens": 20365904} {"current_steps": 31215, "total_steps": 33920, "loss": 0.2711, "lr": 1.926151035057411e-07, "epoch": 18.40507075471698, "percentage": 92.03, "elapsed_time": "1:00:15", "remaining_time": "0:05:13", "throughput": 5633.16, "total_tokens": 20368880} {"current_steps": 31220, "total_steps": 33920, "loss": 0.2884, "lr": 1.9190853821329626e-07, "epoch": 18.40801886792453, "percentage": 92.04, "elapsed_time": "1:00:16", "remaining_time": "0:05:12", "throughput": 5633.19, "total_tokens": 20371920} {"current_steps": 31225, "total_steps": 33920, "loss": 0.4157, "lr": 1.9120324588378757e-07, "epoch": 18.410966981132077, "percentage": 92.05, "elapsed_time": "1:00:16", "remaining_time": "0:05:12", "throughput": 5633.3, "total_tokens": 20375440} {"current_steps": 31230, "total_steps": 33920, "loss": 0.3652, "lr": 1.9049922670394461e-07, "epoch": 18.41391509433962, "percentage": 92.07, "elapsed_time": "1:00:17", "remaining_time": "0:05:11", "throughput": 5633.39, "total_tokens": 20378992} {"current_steps": 31235, "total_steps": 33920, "loss": 0.2763, "lr": 1.897964808601588e-07, "epoch": 18.41686320754717, "percentage": 92.08, "elapsed_time": "1:00:18", "remaining_time": "0:05:11", "throughput": 5633.33, "total_tokens": 20381616} {"current_steps": 31240, "total_steps": 33920, "loss": 0.2763, "lr": 1.8909500853848517e-07, "epoch": 18.419811320754718, "percentage": 92.1, "elapsed_time": "1:00:18", "remaining_time": "0:05:10", "throughput": 5633.29, "total_tokens": 20384880} {"current_steps": 31245, "total_steps": 33920, "loss": 0.4847, "lr": 1.8839480992464243e-07, "epoch": 18.422759433962263, "percentage": 92.11, "elapsed_time": "1:00:19", "remaining_time": "0:05:09", "throughput": 5633.35, "total_tokens": 20388048} {"current_steps": 31250, "total_steps": 33920, "loss": 0.3937, "lr": 1.8769588520401005e-07, "epoch": 18.42570754716981, "percentage": 92.13, "elapsed_time": "1:00:19", "remaining_time": "0:05:09", "throughput": 5633.41, "total_tokens": 20391824} {"current_steps": 31255, "total_steps": 33920, "loss": 0.2707, "lr": 1.8699823456163279e-07, "epoch": 18.42865566037736, "percentage": 92.14, "elapsed_time": "1:00:20", "remaining_time": "0:05:08", "throughput": 5633.45, "total_tokens": 20395280} {"current_steps": 31260, "total_steps": 33920, "loss": 0.3827, "lr": 1.8630185818221514e-07, "epoch": 18.431603773584907, "percentage": 92.16, "elapsed_time": "1:00:20", "remaining_time": "0:05:08", "throughput": 5633.46, "total_tokens": 20398320} {"current_steps": 31265, "total_steps": 33920, "loss": 0.3208, "lr": 1.856067562501268e-07, "epoch": 18.434551886792452, "percentage": 92.17, "elapsed_time": "1:00:21", "remaining_time": "0:05:07", "throughput": 5633.37, "total_tokens": 20400944} {"current_steps": 31270, "total_steps": 33920, "loss": 0.2665, "lr": 1.8491292894939837e-07, "epoch": 18.4375, "percentage": 92.19, "elapsed_time": "1:00:21", "remaining_time": "0:05:06", "throughput": 5633.4, "total_tokens": 20404112} {"current_steps": 31275, "total_steps": 33920, "loss": 0.2769, "lr": 1.8422037646372405e-07, "epoch": 18.440448113207548, "percentage": 92.2, "elapsed_time": "1:00:22", "remaining_time": "0:05:06", "throughput": 5633.47, "total_tokens": 20408048} {"current_steps": 31280, "total_steps": 33920, "loss": 0.3773, "lr": 1.8352909897645989e-07, "epoch": 18.443396226415093, "percentage": 92.22, "elapsed_time": "1:00:23", "remaining_time": "0:05:05", "throughput": 5633.58, "total_tokens": 20411792} {"current_steps": 31285, "total_steps": 33920, "loss": 0.3554, "lr": 1.8283909667062448e-07, "epoch": 18.44634433962264, "percentage": 92.23, "elapsed_time": "1:00:23", "remaining_time": "0:05:05", "throughput": 5633.59, "total_tokens": 20414896} {"current_steps": 31290, "total_steps": 33920, "loss": 0.2903, "lr": 1.82150369728899e-07, "epoch": 18.44929245283019, "percentage": 92.25, "elapsed_time": "1:00:24", "remaining_time": "0:05:04", "throughput": 5633.61, "total_tokens": 20417744} {"current_steps": 31295, "total_steps": 33920, "loss": 0.274, "lr": 1.814629183336275e-07, "epoch": 18.452240566037737, "percentage": 92.26, "elapsed_time": "1:00:24", "remaining_time": "0:05:04", "throughput": 5633.76, "total_tokens": 20421552} {"current_steps": 31300, "total_steps": 33920, "loss": 0.3764, "lr": 1.807767426668139e-07, "epoch": 18.455188679245282, "percentage": 92.28, "elapsed_time": "1:00:25", "remaining_time": "0:05:03", "throughput": 5633.75, "total_tokens": 20424400} {"current_steps": 31305, "total_steps": 33920, "loss": 0.2896, "lr": 1.8009184291012783e-07, "epoch": 18.45813679245283, "percentage": 92.29, "elapsed_time": "1:00:25", "remaining_time": "0:05:02", "throughput": 5633.69, "total_tokens": 20427600} {"current_steps": 31310, "total_steps": 33920, "loss": 0.3118, "lr": 1.7940821924489926e-07, "epoch": 18.46108490566038, "percentage": 92.31, "elapsed_time": "1:00:26", "remaining_time": "0:05:02", "throughput": 5633.8, "total_tokens": 20431568} {"current_steps": 31315, "total_steps": 33920, "loss": 0.3353, "lr": 1.7872587185212009e-07, "epoch": 18.464033018867923, "percentage": 92.32, "elapsed_time": "1:00:27", "remaining_time": "0:05:01", "throughput": 5633.8, "total_tokens": 20434704} {"current_steps": 31320, "total_steps": 33920, "loss": 0.3823, "lr": 1.7804480091244524e-07, "epoch": 18.46698113207547, "percentage": 92.33, "elapsed_time": "1:00:27", "remaining_time": "0:05:01", "throughput": 5633.8, "total_tokens": 20437968} {"current_steps": 31325, "total_steps": 33920, "loss": 0.3554, "lr": 1.7736500660619104e-07, "epoch": 18.46992924528302, "percentage": 92.35, "elapsed_time": "1:00:28", "remaining_time": "0:05:00", "throughput": 5633.94, "total_tokens": 20441872} {"current_steps": 31330, "total_steps": 33920, "loss": 0.3027, "lr": 1.766864891133352e-07, "epoch": 18.472877358490567, "percentage": 92.36, "elapsed_time": "1:00:28", "remaining_time": "0:04:59", "throughput": 5634.0, "total_tokens": 20445072} {"current_steps": 31335, "total_steps": 33920, "loss": 0.3749, "lr": 1.7600924861351843e-07, "epoch": 18.475825471698112, "percentage": 92.38, "elapsed_time": "1:00:29", "remaining_time": "0:04:59", "throughput": 5634.27, "total_tokens": 20451920} {"current_steps": 31340, "total_steps": 33920, "loss": 0.2864, "lr": 1.7533328528604398e-07, "epoch": 18.47877358490566, "percentage": 92.39, "elapsed_time": "1:00:30", "remaining_time": "0:04:58", "throughput": 5634.45, "total_tokens": 20456656} {"current_steps": 31345, "total_steps": 33920, "loss": 0.2848, "lr": 1.746585993098754e-07, "epoch": 18.48172169811321, "percentage": 92.41, "elapsed_time": "1:00:31", "remaining_time": "0:04:58", "throughput": 5634.39, "total_tokens": 20459600} {"current_steps": 31350, "total_steps": 33920, "loss": 0.2667, "lr": 1.7398519086363864e-07, "epoch": 18.484669811320753, "percentage": 92.42, "elapsed_time": "1:00:31", "remaining_time": "0:04:57", "throughput": 5634.44, "total_tokens": 20462768} {"current_steps": 31355, "total_steps": 33920, "loss": 0.2421, "lr": 1.733130601256211e-07, "epoch": 18.4876179245283, "percentage": 92.44, "elapsed_time": "1:00:32", "remaining_time": "0:04:57", "throughput": 5634.4, "total_tokens": 20465488} {"current_steps": 31360, "total_steps": 33920, "loss": 0.5042, "lr": 1.7264220727377323e-07, "epoch": 18.49056603773585, "percentage": 92.45, "elapsed_time": "1:00:32", "remaining_time": "0:04:56", "throughput": 5634.49, "total_tokens": 20469264} {"current_steps": 31365, "total_steps": 33920, "loss": 0.2789, "lr": 1.7197263248570517e-07, "epoch": 18.493514150943398, "percentage": 92.47, "elapsed_time": "1:00:33", "remaining_time": "0:04:55", "throughput": 5634.47, "total_tokens": 20472176} {"current_steps": 31370, "total_steps": 33920, "loss": 0.3625, "lr": 1.7130433593869124e-07, "epoch": 18.496462264150942, "percentage": 92.48, "elapsed_time": "1:00:33", "remaining_time": "0:04:55", "throughput": 5634.59, "total_tokens": 20476048} {"current_steps": 31375, "total_steps": 33920, "loss": 0.2588, "lr": 1.706373178096643e-07, "epoch": 18.49941037735849, "percentage": 92.5, "elapsed_time": "1:00:34", "remaining_time": "0:04:54", "throughput": 5634.67, "total_tokens": 20479888} {"current_steps": 31380, "total_steps": 33920, "loss": 0.3334, "lr": 1.6997157827522092e-07, "epoch": 18.50235849056604, "percentage": 92.51, "elapsed_time": "1:00:35", "remaining_time": "0:04:54", "throughput": 5634.63, "total_tokens": 20482896} {"current_steps": 31385, "total_steps": 33920, "loss": 0.2593, "lr": 1.6930711751161843e-07, "epoch": 18.505306603773583, "percentage": 92.53, "elapsed_time": "1:00:35", "remaining_time": "0:04:53", "throughput": 5634.72, "total_tokens": 20486352} {"current_steps": 31390, "total_steps": 33920, "loss": 0.2878, "lr": 1.6864393569477556e-07, "epoch": 18.50825471698113, "percentage": 92.54, "elapsed_time": "1:00:36", "remaining_time": "0:04:53", "throughput": 5634.77, "total_tokens": 20489456} {"current_steps": 31395, "total_steps": 33920, "loss": 0.2706, "lr": 1.6798203300027295e-07, "epoch": 18.51120283018868, "percentage": 92.56, "elapsed_time": "1:00:36", "remaining_time": "0:04:52", "throughput": 5634.98, "total_tokens": 20493744} {"current_steps": 31400, "total_steps": 33920, "loss": 0.4022, "lr": 1.6732140960335152e-07, "epoch": 18.514150943396228, "percentage": 92.57, "elapsed_time": "1:00:37", "remaining_time": "0:04:51", "throughput": 5634.85, "total_tokens": 20496400} {"current_steps": 31405, "total_steps": 33920, "loss": 0.411, "lr": 1.666620656789153e-07, "epoch": 18.517099056603772, "percentage": 92.59, "elapsed_time": "1:00:37", "remaining_time": "0:04:51", "throughput": 5634.72, "total_tokens": 20498768} {"current_steps": 31410, "total_steps": 33920, "loss": 0.2382, "lr": 1.660040014015274e-07, "epoch": 18.52004716981132, "percentage": 92.6, "elapsed_time": "1:00:38", "remaining_time": "0:04:50", "throughput": 5634.7, "total_tokens": 20501584} {"current_steps": 31415, "total_steps": 33920, "loss": 0.1969, "lr": 1.6534721694541344e-07, "epoch": 18.52299528301887, "percentage": 92.61, "elapsed_time": "1:00:38", "remaining_time": "0:04:50", "throughput": 5634.63, "total_tokens": 20504144} {"current_steps": 31420, "total_steps": 33920, "loss": 0.3683, "lr": 1.6469171248445993e-07, "epoch": 18.525943396226417, "percentage": 92.63, "elapsed_time": "1:00:39", "remaining_time": "0:04:49", "throughput": 5634.73, "total_tokens": 20507728} {"current_steps": 31425, "total_steps": 33920, "loss": 0.2864, "lr": 1.6403748819221464e-07, "epoch": 18.52889150943396, "percentage": 92.64, "elapsed_time": "1:00:40", "remaining_time": "0:04:49", "throughput": 5634.88, "total_tokens": 20511472} {"current_steps": 31430, "total_steps": 33920, "loss": 0.2558, "lr": 1.6338454424188632e-07, "epoch": 18.53183962264151, "percentage": 92.66, "elapsed_time": "1:00:40", "remaining_time": "0:04:48", "throughput": 5634.88, "total_tokens": 20514448} {"current_steps": 31435, "total_steps": 33920, "loss": 0.3448, "lr": 1.6273288080634442e-07, "epoch": 18.534787735849058, "percentage": 92.67, "elapsed_time": "1:00:41", "remaining_time": "0:04:47", "throughput": 5634.93, "total_tokens": 20517584} {"current_steps": 31440, "total_steps": 33920, "loss": 0.3152, "lr": 1.6208249805811982e-07, "epoch": 18.537735849056602, "percentage": 92.69, "elapsed_time": "1:00:41", "remaining_time": "0:04:47", "throughput": 5635.09, "total_tokens": 20521456} {"current_steps": 31445, "total_steps": 33920, "loss": 0.1984, "lr": 1.6143339616940423e-07, "epoch": 18.54068396226415, "percentage": 92.7, "elapsed_time": "1:00:42", "remaining_time": "0:04:46", "throughput": 5635.09, "total_tokens": 20524336} {"current_steps": 31450, "total_steps": 33920, "loss": 0.2552, "lr": 1.6078557531205018e-07, "epoch": 18.5436320754717, "percentage": 92.72, "elapsed_time": "1:00:42", "remaining_time": "0:04:46", "throughput": 5635.17, "total_tokens": 20527856} {"current_steps": 31455, "total_steps": 33920, "loss": 0.3231, "lr": 1.601390356575705e-07, "epoch": 18.546580188679247, "percentage": 92.73, "elapsed_time": "1:00:43", "remaining_time": "0:04:45", "throughput": 5635.32, "total_tokens": 20532080} {"current_steps": 31460, "total_steps": 33920, "loss": 0.3175, "lr": 1.5949377737713988e-07, "epoch": 18.54952830188679, "percentage": 92.75, "elapsed_time": "1:00:44", "remaining_time": "0:04:44", "throughput": 5635.53, "total_tokens": 20536560} {"current_steps": 31465, "total_steps": 33920, "loss": 0.273, "lr": 1.5884980064159338e-07, "epoch": 18.55247641509434, "percentage": 92.76, "elapsed_time": "1:00:44", "remaining_time": "0:04:44", "throughput": 5635.46, "total_tokens": 20539472} {"current_steps": 31470, "total_steps": 33920, "loss": 0.3347, "lr": 1.5820710562142627e-07, "epoch": 18.555424528301888, "percentage": 92.78, "elapsed_time": "1:00:45", "remaining_time": "0:04:43", "throughput": 5635.58, "total_tokens": 20543728} {"current_steps": 31475, "total_steps": 33920, "loss": 0.325, "lr": 1.575656924867952e-07, "epoch": 18.558372641509433, "percentage": 92.79, "elapsed_time": "1:00:45", "remaining_time": "0:04:43", "throughput": 5635.66, "total_tokens": 20547248} {"current_steps": 31480, "total_steps": 33920, "loss": 0.3612, "lr": 1.5692556140751658e-07, "epoch": 18.56132075471698, "percentage": 92.81, "elapsed_time": "1:00:46", "remaining_time": "0:04:42", "throughput": 5635.76, "total_tokens": 20550608} {"current_steps": 31485, "total_steps": 33920, "loss": 0.2816, "lr": 1.5628671255306706e-07, "epoch": 18.56426886792453, "percentage": 92.82, "elapsed_time": "1:00:47", "remaining_time": "0:04:42", "throughput": 5635.74, "total_tokens": 20553744} {"current_steps": 31490, "total_steps": 33920, "loss": 0.2924, "lr": 1.556491460925863e-07, "epoch": 18.567216981132077, "percentage": 92.84, "elapsed_time": "1:00:47", "remaining_time": "0:04:41", "throughput": 5635.57, "total_tokens": 20556016} {"current_steps": 31495, "total_steps": 33920, "loss": 0.2443, "lr": 1.550128621948721e-07, "epoch": 18.57016509433962, "percentage": 92.85, "elapsed_time": "1:00:48", "remaining_time": "0:04:40", "throughput": 5635.54, "total_tokens": 20559184} {"current_steps": 31500, "total_steps": 33920, "loss": 0.3123, "lr": 1.5437786102838413e-07, "epoch": 18.57311320754717, "percentage": 92.87, "elapsed_time": "1:00:48", "remaining_time": "0:04:40", "throughput": 5635.48, "total_tokens": 20561904} {"current_steps": 31505, "total_steps": 33920, "loss": 0.3126, "lr": 1.5374414276124017e-07, "epoch": 18.576061320754718, "percentage": 92.88, "elapsed_time": "1:00:49", "remaining_time": "0:04:39", "throughput": 5635.65, "total_tokens": 20566448} {"current_steps": 31510, "total_steps": 33920, "loss": 0.2926, "lr": 1.5311170756122095e-07, "epoch": 18.579009433962263, "percentage": 92.9, "elapsed_time": "1:00:49", "remaining_time": "0:04:39", "throughput": 5635.55, "total_tokens": 20568880} {"current_steps": 31515, "total_steps": 33920, "loss": 0.3251, "lr": 1.5248055559576647e-07, "epoch": 18.58195754716981, "percentage": 92.91, "elapsed_time": "1:00:50", "remaining_time": "0:04:38", "throughput": 5635.55, "total_tokens": 20571888} {"current_steps": 31520, "total_steps": 33920, "loss": 0.4509, "lr": 1.5185068703197526e-07, "epoch": 18.58490566037736, "percentage": 92.92, "elapsed_time": "1:00:50", "remaining_time": "0:04:37", "throughput": 5635.58, "total_tokens": 20574768} {"current_steps": 31525, "total_steps": 33920, "loss": 0.2427, "lr": 1.5122210203661004e-07, "epoch": 18.587853773584907, "percentage": 92.94, "elapsed_time": "1:00:51", "remaining_time": "0:04:37", "throughput": 5635.6, "total_tokens": 20578032} {"current_steps": 31530, "total_steps": 33920, "loss": 0.3167, "lr": 1.505948007760899e-07, "epoch": 18.590801886792452, "percentage": 92.95, "elapsed_time": "1:00:51", "remaining_time": "0:04:36", "throughput": 5635.45, "total_tokens": 20580208} {"current_steps": 31535, "total_steps": 33920, "loss": 0.4487, "lr": 1.4996878341649647e-07, "epoch": 18.59375, "percentage": 92.97, "elapsed_time": "1:00:52", "remaining_time": "0:04:36", "throughput": 5635.44, "total_tokens": 20583024} {"current_steps": 31540, "total_steps": 33920, "loss": 0.3554, "lr": 1.493440501235699e-07, "epoch": 18.596698113207548, "percentage": 92.98, "elapsed_time": "1:00:52", "remaining_time": "0:04:35", "throughput": 5635.36, "total_tokens": 20585744} {"current_steps": 31545, "total_steps": 33920, "loss": 0.308, "lr": 1.487206010627118e-07, "epoch": 18.599646226415093, "percentage": 93.0, "elapsed_time": "1:00:53", "remaining_time": "0:04:35", "throughput": 5635.48, "total_tokens": 20589296} {"current_steps": 31550, "total_steps": 33920, "loss": 0.3127, "lr": 1.4809843639898124e-07, "epoch": 18.60259433962264, "percentage": 93.01, "elapsed_time": "1:00:54", "remaining_time": "0:04:34", "throughput": 5635.52, "total_tokens": 20592400} {"current_steps": 31555, "total_steps": 33920, "loss": 0.1978, "lr": 1.4747755629710093e-07, "epoch": 18.60554245283019, "percentage": 93.03, "elapsed_time": "1:00:54", "remaining_time": "0:04:33", "throughput": 5635.48, "total_tokens": 20595024} {"current_steps": 31560, "total_steps": 33920, "loss": 0.2828, "lr": 1.4685796092145045e-07, "epoch": 18.608490566037737, "percentage": 93.04, "elapsed_time": "1:00:55", "remaining_time": "0:04:33", "throughput": 5635.61, "total_tokens": 20598544} {"current_steps": 31565, "total_steps": 33920, "loss": 0.3113, "lr": 1.4623965043607135e-07, "epoch": 18.611438679245282, "percentage": 93.06, "elapsed_time": "1:00:55", "remaining_time": "0:04:32", "throughput": 5635.64, "total_tokens": 20601456} {"current_steps": 31570, "total_steps": 33920, "loss": 0.3825, "lr": 1.4562262500466273e-07, "epoch": 18.61438679245283, "percentage": 93.07, "elapsed_time": "1:00:56", "remaining_time": "0:04:32", "throughput": 5635.67, "total_tokens": 20604336} {"current_steps": 31575, "total_steps": 33920, "loss": 0.2636, "lr": 1.4500688479058556e-07, "epoch": 18.61733490566038, "percentage": 93.09, "elapsed_time": "1:00:56", "remaining_time": "0:04:31", "throughput": 5635.58, "total_tokens": 20607184} {"current_steps": 31580, "total_steps": 33920, "loss": 0.2943, "lr": 1.4439242995685943e-07, "epoch": 18.620283018867923, "percentage": 93.1, "elapsed_time": "1:00:57", "remaining_time": "0:04:30", "throughput": 5635.7, "total_tokens": 20610896} {"current_steps": 31585, "total_steps": 33920, "loss": 0.3603, "lr": 1.4377926066616364e-07, "epoch": 18.62323113207547, "percentage": 93.12, "elapsed_time": "1:00:57", "remaining_time": "0:04:30", "throughput": 5635.76, "total_tokens": 20613936} {"current_steps": 31590, "total_steps": 33920, "loss": 0.3972, "lr": 1.4316737708083783e-07, "epoch": 18.62617924528302, "percentage": 93.13, "elapsed_time": "1:00:58", "remaining_time": "0:04:29", "throughput": 5635.78, "total_tokens": 20617136} {"current_steps": 31595, "total_steps": 33920, "loss": 0.3487, "lr": 1.4255677936288127e-07, "epoch": 18.629127358490567, "percentage": 93.15, "elapsed_time": "1:00:58", "remaining_time": "0:04:29", "throughput": 5635.85, "total_tokens": 20620304} {"current_steps": 31600, "total_steps": 33920, "loss": 0.3254, "lr": 1.4194746767395184e-07, "epoch": 18.632075471698112, "percentage": 93.16, "elapsed_time": "1:00:59", "remaining_time": "0:04:28", "throughput": 5635.89, "total_tokens": 20623728} {"current_steps": 31605, "total_steps": 33920, "loss": 0.2835, "lr": 1.4133944217536722e-07, "epoch": 18.63502358490566, "percentage": 93.18, "elapsed_time": "1:00:59", "remaining_time": "0:04:28", "throughput": 5635.89, "total_tokens": 20627088} {"current_steps": 31610, "total_steps": 33920, "loss": 0.2135, "lr": 1.4073270302810471e-07, "epoch": 18.63797169811321, "percentage": 93.19, "elapsed_time": "1:01:00", "remaining_time": "0:04:27", "throughput": 5635.95, "total_tokens": 20631088} {"current_steps": 31615, "total_steps": 33920, "loss": 0.2733, "lr": 1.4012725039280084e-07, "epoch": 18.640919811320753, "percentage": 93.2, "elapsed_time": "1:01:01", "remaining_time": "0:04:26", "throughput": 5635.91, "total_tokens": 20634032} {"current_steps": 31620, "total_steps": 33920, "loss": 0.3314, "lr": 1.3952308442975292e-07, "epoch": 18.6438679245283, "percentage": 93.22, "elapsed_time": "1:01:01", "remaining_time": "0:04:26", "throughput": 5635.91, "total_tokens": 20637104} {"current_steps": 31625, "total_steps": 33920, "loss": 0.2342, "lr": 1.3892020529891637e-07, "epoch": 18.64681603773585, "percentage": 93.23, "elapsed_time": "1:01:02", "remaining_time": "0:04:25", "throughput": 5635.92, "total_tokens": 20640368} {"current_steps": 31630, "total_steps": 33920, "loss": 0.3761, "lr": 1.3831861315990514e-07, "epoch": 18.649764150943398, "percentage": 93.25, "elapsed_time": "1:01:02", "remaining_time": "0:04:25", "throughput": 5635.87, "total_tokens": 20643056} {"current_steps": 31635, "total_steps": 33920, "loss": 0.3219, "lr": 1.377183081719935e-07, "epoch": 18.652712264150942, "percentage": 93.26, "elapsed_time": "1:01:03", "remaining_time": "0:04:24", "throughput": 5636.03, "total_tokens": 20647376} {"current_steps": 31640, "total_steps": 33920, "loss": 0.2729, "lr": 1.3711929049411544e-07, "epoch": 18.65566037735849, "percentage": 93.28, "elapsed_time": "1:01:04", "remaining_time": "0:04:24", "throughput": 5636.11, "total_tokens": 20650864} {"current_steps": 31645, "total_steps": 33920, "loss": 0.3813, "lr": 1.365215602848624e-07, "epoch": 18.65860849056604, "percentage": 93.29, "elapsed_time": "1:01:04", "remaining_time": "0:04:23", "throughput": 5636.1, "total_tokens": 20653712} {"current_steps": 31650, "total_steps": 33920, "loss": 0.3763, "lr": 1.3592511770248727e-07, "epoch": 18.661556603773583, "percentage": 93.31, "elapsed_time": "1:01:05", "remaining_time": "0:04:22", "throughput": 5636.09, "total_tokens": 20656528} {"current_steps": 31655, "total_steps": 33920, "loss": 0.2725, "lr": 1.3532996290490041e-07, "epoch": 18.66450471698113, "percentage": 93.32, "elapsed_time": "1:01:05", "remaining_time": "0:04:22", "throughput": 5636.04, "total_tokens": 20659440} {"current_steps": 31660, "total_steps": 33920, "loss": 0.2856, "lr": 1.347360960496713e-07, "epoch": 18.66745283018868, "percentage": 93.34, "elapsed_time": "1:01:06", "remaining_time": "0:04:21", "throughput": 5635.92, "total_tokens": 20662096} {"current_steps": 31665, "total_steps": 33920, "loss": 0.289, "lr": 1.3414351729402862e-07, "epoch": 18.670400943396228, "percentage": 93.35, "elapsed_time": "1:01:06", "remaining_time": "0:04:21", "throughput": 5635.95, "total_tokens": 20665808} {"current_steps": 31670, "total_steps": 33920, "loss": 0.3186, "lr": 1.3355222679486025e-07, "epoch": 18.673349056603772, "percentage": 93.37, "elapsed_time": "1:01:07", "remaining_time": "0:04:20", "throughput": 5635.95, "total_tokens": 20668848} {"current_steps": 31675, "total_steps": 33920, "loss": 0.2851, "lr": 1.3296222470871367e-07, "epoch": 18.67629716981132, "percentage": 93.38, "elapsed_time": "1:01:07", "remaining_time": "0:04:19", "throughput": 5635.9, "total_tokens": 20671760} {"current_steps": 31680, "total_steps": 33920, "loss": 0.2815, "lr": 1.3237351119179287e-07, "epoch": 18.67924528301887, "percentage": 93.4, "elapsed_time": "1:01:08", "remaining_time": "0:04:19", "throughput": 5635.95, "total_tokens": 20675472} {"current_steps": 31685, "total_steps": 33920, "loss": 0.2789, "lr": 1.3178608639996425e-07, "epoch": 18.682193396226417, "percentage": 93.41, "elapsed_time": "1:01:08", "remaining_time": "0:04:18", "throughput": 5635.91, "total_tokens": 20678128} {"current_steps": 31690, "total_steps": 33920, "loss": 0.3361, "lr": 1.3119995048874957e-07, "epoch": 18.68514150943396, "percentage": 93.43, "elapsed_time": "1:01:09", "remaining_time": "0:04:18", "throughput": 5635.98, "total_tokens": 20681360} {"current_steps": 31695, "total_steps": 33920, "loss": 0.3677, "lr": 1.3061510361333186e-07, "epoch": 18.68808962264151, "percentage": 93.44, "elapsed_time": "1:01:10", "remaining_time": "0:04:17", "throughput": 5636.04, "total_tokens": 20684816} {"current_steps": 31700, "total_steps": 33920, "loss": 0.2802, "lr": 1.3003154592855116e-07, "epoch": 18.691037735849058, "percentage": 93.46, "elapsed_time": "1:01:10", "remaining_time": "0:04:17", "throughput": 5636.22, "total_tokens": 20689232} {"current_steps": 31705, "total_steps": 33920, "loss": 0.2515, "lr": 1.2944927758890668e-07, "epoch": 18.693985849056602, "percentage": 93.47, "elapsed_time": "1:01:11", "remaining_time": "0:04:16", "throughput": 5636.09, "total_tokens": 20691664} {"current_steps": 31710, "total_steps": 33920, "loss": 0.2726, "lr": 1.2886829874855733e-07, "epoch": 18.69693396226415, "percentage": 93.48, "elapsed_time": "1:01:11", "remaining_time": "0:04:15", "throughput": 5636.14, "total_tokens": 20694896} {"current_steps": 31715, "total_steps": 33920, "loss": 0.2433, "lr": 1.2828860956131894e-07, "epoch": 18.6998820754717, "percentage": 93.5, "elapsed_time": "1:01:12", "remaining_time": "0:04:15", "throughput": 5636.28, "total_tokens": 20699312} {"current_steps": 31720, "total_steps": 33920, "loss": 0.2558, "lr": 1.2771021018066765e-07, "epoch": 18.702830188679247, "percentage": 93.51, "elapsed_time": "1:01:13", "remaining_time": "0:04:14", "throughput": 5636.38, "total_tokens": 20703056} {"current_steps": 31725, "total_steps": 33920, "loss": 0.2757, "lr": 1.271331007597365e-07, "epoch": 18.70577830188679, "percentage": 93.53, "elapsed_time": "1:01:13", "remaining_time": "0:04:14", "throughput": 5636.29, "total_tokens": 20705520} {"current_steps": 31730, "total_steps": 33920, "loss": 0.3836, "lr": 1.2655728145131774e-07, "epoch": 18.70872641509434, "percentage": 93.54, "elapsed_time": "1:01:14", "remaining_time": "0:04:13", "throughput": 5636.23, "total_tokens": 20708784} {"current_steps": 31735, "total_steps": 33920, "loss": 0.3546, "lr": 1.2598275240786105e-07, "epoch": 18.711674528301888, "percentage": 93.56, "elapsed_time": "1:01:14", "remaining_time": "0:04:13", "throughput": 5636.28, "total_tokens": 20712176} {"current_steps": 31740, "total_steps": 33920, "loss": 0.3474, "lr": 1.254095137814776e-07, "epoch": 18.714622641509433, "percentage": 93.57, "elapsed_time": "1:01:15", "remaining_time": "0:04:12", "throughput": 5636.25, "total_tokens": 20715152} {"current_steps": 31745, "total_steps": 33920, "loss": 0.2912, "lr": 1.2483756572393368e-07, "epoch": 18.71757075471698, "percentage": 93.59, "elapsed_time": "1:01:15", "remaining_time": "0:04:11", "throughput": 5636.31, "total_tokens": 20718480} {"current_steps": 31750, "total_steps": 33920, "loss": 0.2832, "lr": 1.242669083866549e-07, "epoch": 18.72051886792453, "percentage": 93.6, "elapsed_time": "1:01:16", "remaining_time": "0:04:11", "throughput": 5636.21, "total_tokens": 20720944} {"current_steps": 31755, "total_steps": 33920, "loss": 0.3728, "lr": 1.2369754192072537e-07, "epoch": 18.723466981132077, "percentage": 93.62, "elapsed_time": "1:01:16", "remaining_time": "0:04:10", "throughput": 5636.2, "total_tokens": 20723856} {"current_steps": 31760, "total_steps": 33920, "loss": 0.3143, "lr": 1.231294664768873e-07, "epoch": 18.72641509433962, "percentage": 93.63, "elapsed_time": "1:01:17", "remaining_time": "0:04:10", "throughput": 5636.19, "total_tokens": 20726928} {"current_steps": 31765, "total_steps": 33920, "loss": 0.3305, "lr": 1.225626822055409e-07, "epoch": 18.72936320754717, "percentage": 93.65, "elapsed_time": "1:01:18", "remaining_time": "0:04:09", "throughput": 5636.2, "total_tokens": 20730192} {"current_steps": 31770, "total_steps": 33920, "loss": 0.2117, "lr": 1.2199718925674508e-07, "epoch": 18.732311320754718, "percentage": 93.66, "elapsed_time": "1:01:18", "remaining_time": "0:04:08", "throughput": 5636.37, "total_tokens": 20735376} {"current_steps": 31775, "total_steps": 33920, "loss": 0.2889, "lr": 1.2143298778021616e-07, "epoch": 18.735259433962263, "percentage": 93.68, "elapsed_time": "1:01:19", "remaining_time": "0:04:08", "throughput": 5636.54, "total_tokens": 20739888} {"current_steps": 31780, "total_steps": 33920, "loss": 0.334, "lr": 1.2087007792532967e-07, "epoch": 18.73820754716981, "percentage": 93.69, "elapsed_time": "1:01:20", "remaining_time": "0:04:07", "throughput": 5636.5, "total_tokens": 20742640} {"current_steps": 31785, "total_steps": 33920, "loss": 0.2551, "lr": 1.203084598411175e-07, "epoch": 18.74115566037736, "percentage": 93.71, "elapsed_time": "1:01:20", "remaining_time": "0:04:07", "throughput": 5636.55, "total_tokens": 20745808} {"current_steps": 31790, "total_steps": 33920, "loss": 0.2814, "lr": 1.1974813367627124e-07, "epoch": 18.744103773584907, "percentage": 93.72, "elapsed_time": "1:01:21", "remaining_time": "0:04:06", "throughput": 5636.51, "total_tokens": 20748592} {"current_steps": 31795, "total_steps": 33920, "loss": 0.3338, "lr": 1.1918909957913949e-07, "epoch": 18.747051886792452, "percentage": 93.74, "elapsed_time": "1:01:21", "remaining_time": "0:04:06", "throughput": 5636.62, "total_tokens": 20752048} {"current_steps": 31800, "total_steps": 33920, "loss": 0.3979, "lr": 1.1863135769772827e-07, "epoch": 18.75, "percentage": 93.75, "elapsed_time": "1:01:22", "remaining_time": "0:04:05", "throughput": 5636.91, "total_tokens": 20758544} {"current_steps": 31805, "total_steps": 33920, "loss": 0.2111, "lr": 1.1807490817970279e-07, "epoch": 18.752948113207548, "percentage": 93.76, "elapsed_time": "1:01:23", "remaining_time": "0:04:04", "throughput": 5637.04, "total_tokens": 20762672} {"current_steps": 31810, "total_steps": 33920, "loss": 0.2503, "lr": 1.1751975117238578e-07, "epoch": 18.755896226415093, "percentage": 93.78, "elapsed_time": "1:01:23", "remaining_time": "0:04:04", "throughput": 5637.04, "total_tokens": 20765776} {"current_steps": 31815, "total_steps": 33920, "loss": 0.2976, "lr": 1.1696588682275633e-07, "epoch": 18.75884433962264, "percentage": 93.79, "elapsed_time": "1:01:24", "remaining_time": "0:04:03", "throughput": 5636.97, "total_tokens": 20768528} {"current_steps": 31820, "total_steps": 33920, "loss": 0.3963, "lr": 1.1641331527745325e-07, "epoch": 18.76179245283019, "percentage": 93.81, "elapsed_time": "1:01:25", "remaining_time": "0:04:03", "throughput": 5637.23, "total_tokens": 20775248} {"current_steps": 31825, "total_steps": 33920, "loss": 0.2465, "lr": 1.1586203668277229e-07, "epoch": 18.764740566037737, "percentage": 93.82, "elapsed_time": "1:01:25", "remaining_time": "0:04:02", "throughput": 5637.31, "total_tokens": 20778736} {"current_steps": 31830, "total_steps": 33920, "loss": 0.3572, "lr": 1.1531205118466615e-07, "epoch": 18.767688679245282, "percentage": 93.84, "elapsed_time": "1:01:26", "remaining_time": "0:04:02", "throughput": 5637.42, "total_tokens": 20782128} {"current_steps": 31835, "total_steps": 33920, "loss": 0.3461, "lr": 1.1476335892874669e-07, "epoch": 18.77063679245283, "percentage": 93.85, "elapsed_time": "1:01:27", "remaining_time": "0:04:01", "throughput": 5637.43, "total_tokens": 20785424} {"current_steps": 31840, "total_steps": 33920, "loss": 0.4265, "lr": 1.1421596006028157e-07, "epoch": 18.77358490566038, "percentage": 93.87, "elapsed_time": "1:01:27", "remaining_time": "0:04:00", "throughput": 5637.51, "total_tokens": 20788976} {"current_steps": 31845, "total_steps": 33920, "loss": 0.2755, "lr": 1.1366985472419823e-07, "epoch": 18.776533018867923, "percentage": 93.88, "elapsed_time": "1:01:28", "remaining_time": "0:04:00", "throughput": 5637.45, "total_tokens": 20791536} {"current_steps": 31850, "total_steps": 33920, "loss": 0.2372, "lr": 1.1312504306507987e-07, "epoch": 18.77948113207547, "percentage": 93.9, "elapsed_time": "1:01:28", "remaining_time": "0:03:59", "throughput": 5637.63, "total_tokens": 20795568} {"current_steps": 31855, "total_steps": 33920, "loss": 0.3405, "lr": 1.1258152522716725e-07, "epoch": 18.78242924528302, "percentage": 93.91, "elapsed_time": "1:01:29", "remaining_time": "0:03:59", "throughput": 5637.65, "total_tokens": 20798832} {"current_steps": 31860, "total_steps": 33920, "loss": 0.2894, "lr": 1.1203930135435914e-07, "epoch": 18.785377358490567, "percentage": 93.93, "elapsed_time": "1:01:29", "remaining_time": "0:03:58", "throughput": 5637.71, "total_tokens": 20802352} {"current_steps": 31865, "total_steps": 33920, "loss": 0.3813, "lr": 1.1149837159021238e-07, "epoch": 18.788325471698112, "percentage": 93.94, "elapsed_time": "1:01:30", "remaining_time": "0:03:57", "throughput": 5637.86, "total_tokens": 20806160} {"current_steps": 31870, "total_steps": 33920, "loss": 0.2949, "lr": 1.1095873607793961e-07, "epoch": 18.79127358490566, "percentage": 93.96, "elapsed_time": "1:01:31", "remaining_time": "0:03:57", "throughput": 5637.87, "total_tokens": 20809424} {"current_steps": 31875, "total_steps": 33920, "loss": 0.3164, "lr": 1.1042039496041212e-07, "epoch": 18.79422169811321, "percentage": 93.97, "elapsed_time": "1:01:31", "remaining_time": "0:03:56", "throughput": 5637.9, "total_tokens": 20812624} {"current_steps": 31880, "total_steps": 33920, "loss": 0.2514, "lr": 1.0988334838015812e-07, "epoch": 18.797169811320753, "percentage": 93.99, "elapsed_time": "1:01:32", "remaining_time": "0:03:56", "throughput": 5637.94, "total_tokens": 20815728} {"current_steps": 31885, "total_steps": 33920, "loss": 0.3727, "lr": 1.0934759647936333e-07, "epoch": 18.8001179245283, "percentage": 94.0, "elapsed_time": "1:01:32", "remaining_time": "0:03:55", "throughput": 5638.04, "total_tokens": 20819664} {"current_steps": 31890, "total_steps": 33920, "loss": 0.2504, "lr": 1.0881313939986926e-07, "epoch": 18.80306603773585, "percentage": 94.02, "elapsed_time": "1:01:33", "remaining_time": "0:03:55", "throughput": 5638.16, "total_tokens": 20823280} {"current_steps": 31895, "total_steps": 33920, "loss": 0.2794, "lr": 1.0827997728317662e-07, "epoch": 18.806014150943398, "percentage": 94.03, "elapsed_time": "1:01:33", "remaining_time": "0:03:54", "throughput": 5638.05, "total_tokens": 20825840} {"current_steps": 31900, "total_steps": 33920, "loss": 0.3608, "lr": 1.0774811027044196e-07, "epoch": 18.808962264150942, "percentage": 94.04, "elapsed_time": "1:01:34", "remaining_time": "0:03:53", "throughput": 5638.03, "total_tokens": 20828816} {"current_steps": 31905, "total_steps": 33920, "loss": 0.224, "lr": 1.0721753850247984e-07, "epoch": 18.81191037735849, "percentage": 94.06, "elapsed_time": "1:01:34", "remaining_time": "0:03:53", "throughput": 5637.91, "total_tokens": 20831280} {"current_steps": 31910, "total_steps": 33920, "loss": 0.1971, "lr": 1.0668826211976124e-07, "epoch": 18.81485849056604, "percentage": 94.07, "elapsed_time": "1:01:35", "remaining_time": "0:03:52", "throughput": 5637.94, "total_tokens": 20834256} {"current_steps": 31915, "total_steps": 33920, "loss": 0.2567, "lr": 1.0616028126241407e-07, "epoch": 18.817806603773583, "percentage": 94.09, "elapsed_time": "1:01:35", "remaining_time": "0:03:52", "throughput": 5637.99, "total_tokens": 20837264} {"current_steps": 31920, "total_steps": 33920, "loss": 0.2677, "lr": 1.0563359607022372e-07, "epoch": 18.82075471698113, "percentage": 94.1, "elapsed_time": "1:01:36", "remaining_time": "0:03:51", "throughput": 5637.98, "total_tokens": 20840208} {"current_steps": 31925, "total_steps": 33920, "loss": 0.2378, "lr": 1.05108206682632e-07, "epoch": 18.82370283018868, "percentage": 94.12, "elapsed_time": "1:01:37", "remaining_time": "0:03:51", "throughput": 5638.06, "total_tokens": 20844336} {"current_steps": 31930, "total_steps": 33920, "loss": 0.2943, "lr": 1.0458411323873874e-07, "epoch": 18.826650943396228, "percentage": 94.13, "elapsed_time": "1:01:37", "remaining_time": "0:03:50", "throughput": 5638.11, "total_tokens": 20847728} {"current_steps": 31935, "total_steps": 33920, "loss": 0.2771, "lr": 1.0406131587729962e-07, "epoch": 18.829599056603772, "percentage": 94.15, "elapsed_time": "1:01:38", "remaining_time": "0:03:49", "throughput": 5638.18, "total_tokens": 20850928} {"current_steps": 31940, "total_steps": 33920, "loss": 0.3013, "lr": 1.035398147367278e-07, "epoch": 18.83254716981132, "percentage": 94.16, "elapsed_time": "1:01:38", "remaining_time": "0:03:49", "throughput": 5638.16, "total_tokens": 20853968} {"current_steps": 31945, "total_steps": 33920, "loss": 0.2883, "lr": 1.030196099550923e-07, "epoch": 18.83549528301887, "percentage": 94.18, "elapsed_time": "1:01:39", "remaining_time": "0:03:48", "throughput": 5638.32, "total_tokens": 20858064} {"current_steps": 31950, "total_steps": 33920, "loss": 0.2785, "lr": 1.0250070167011905e-07, "epoch": 18.838443396226417, "percentage": 94.19, "elapsed_time": "1:01:39", "remaining_time": "0:03:48", "throughput": 5638.16, "total_tokens": 20860208} {"current_steps": 31955, "total_steps": 33920, "loss": 0.2631, "lr": 1.0198309001919315e-07, "epoch": 18.84139150943396, "percentage": 94.21, "elapsed_time": "1:01:40", "remaining_time": "0:03:47", "throughput": 5638.07, "total_tokens": 20862864} {"current_steps": 31960, "total_steps": 33920, "loss": 0.3585, "lr": 1.0146677513935277e-07, "epoch": 18.84433962264151, "percentage": 94.22, "elapsed_time": "1:01:40", "remaining_time": "0:03:46", "throughput": 5638.08, "total_tokens": 20865968} {"current_steps": 31965, "total_steps": 33920, "loss": 0.275, "lr": 1.0095175716729578e-07, "epoch": 18.847287735849058, "percentage": 94.24, "elapsed_time": "1:01:41", "remaining_time": "0:03:46", "throughput": 5638.13, "total_tokens": 20869200} {"current_steps": 31970, "total_steps": 33920, "loss": 0.3183, "lr": 1.004380362393742e-07, "epoch": 18.850235849056602, "percentage": 94.25, "elapsed_time": "1:01:41", "remaining_time": "0:03:45", "throughput": 5638.08, "total_tokens": 20871888} {"current_steps": 31975, "total_steps": 33920, "loss": 0.3647, "lr": 9.99256124915987e-08, "epoch": 18.85318396226415, "percentage": 94.27, "elapsed_time": "1:01:42", "remaining_time": "0:03:45", "throughput": 5638.08, "total_tokens": 20874704} {"current_steps": 31980, "total_steps": 33920, "loss": 0.4206, "lr": 9.941448605963577e-08, "epoch": 18.8561320754717, "percentage": 94.28, "elapsed_time": "1:01:42", "remaining_time": "0:03:44", "throughput": 5638.18, "total_tokens": 20878160} {"current_steps": 31985, "total_steps": 33920, "loss": 0.2586, "lr": 9.890465707880715e-08, "epoch": 18.859080188679247, "percentage": 94.3, "elapsed_time": "1:01:43", "remaining_time": "0:03:44", "throughput": 5638.09, "total_tokens": 20880656} {"current_steps": 31990, "total_steps": 33920, "loss": 0.3039, "lr": 9.839612568409374e-08, "epoch": 18.86202830188679, "percentage": 94.31, "elapsed_time": "1:01:44", "remaining_time": "0:03:43", "throughput": 5638.09, "total_tokens": 20883760} {"current_steps": 31995, "total_steps": 33920, "loss": 0.2815, "lr": 9.788889201013119e-08, "epoch": 18.86497641509434, "percentage": 94.32, "elapsed_time": "1:01:44", "remaining_time": "0:03:42", "throughput": 5638.13, "total_tokens": 20886864} {"current_steps": 32000, "total_steps": 33920, "loss": 0.3522, "lr": 9.738295619121097e-08, "epoch": 18.867924528301888, "percentage": 94.34, "elapsed_time": "1:01:45", "remaining_time": "0:03:42", "throughput": 5638.12, "total_tokens": 20889552} {"current_steps": 32005, "total_steps": 33920, "loss": 0.2596, "lr": 9.687831836128203e-08, "epoch": 18.870872641509433, "percentage": 94.35, "elapsed_time": "1:01:45", "remaining_time": "0:03:41", "throughput": 5638.2, "total_tokens": 20893360} {"current_steps": 32010, "total_steps": 33920, "loss": 0.2454, "lr": 9.637497865395029e-08, "epoch": 18.87382075471698, "percentage": 94.37, "elapsed_time": "1:01:46", "remaining_time": "0:03:41", "throughput": 5638.2, "total_tokens": 20896208} {"current_steps": 32015, "total_steps": 33920, "loss": 0.3027, "lr": 9.587293720247526e-08, "epoch": 18.87676886792453, "percentage": 94.38, "elapsed_time": "1:01:46", "remaining_time": "0:03:40", "throughput": 5638.14, "total_tokens": 20898896} {"current_steps": 32020, "total_steps": 33920, "loss": 0.2769, "lr": 9.537219413977672e-08, "epoch": 18.879716981132077, "percentage": 94.4, "elapsed_time": "1:01:47", "remaining_time": "0:03:39", "throughput": 5638.25, "total_tokens": 20902704} {"current_steps": 32025, "total_steps": 33920, "loss": 0.2813, "lr": 9.487274959842696e-08, "epoch": 18.88266509433962, "percentage": 94.41, "elapsed_time": "1:01:47", "remaining_time": "0:03:39", "throughput": 5638.28, "total_tokens": 20905712} {"current_steps": 32030, "total_steps": 33920, "loss": 0.3012, "lr": 9.437460371065687e-08, "epoch": 18.88561320754717, "percentage": 94.43, "elapsed_time": "1:01:48", "remaining_time": "0:03:38", "throughput": 5638.16, "total_tokens": 20908176} {"current_steps": 32035, "total_steps": 33920, "loss": 0.2973, "lr": 9.387775660835263e-08, "epoch": 18.888561320754718, "percentage": 94.44, "elapsed_time": "1:01:48", "remaining_time": "0:03:38", "throughput": 5638.25, "total_tokens": 20911760} {"current_steps": 32040, "total_steps": 33920, "loss": 0.2477, "lr": 9.338220842305678e-08, "epoch": 18.891509433962263, "percentage": 94.46, "elapsed_time": "1:01:49", "remaining_time": "0:03:37", "throughput": 5638.18, "total_tokens": 20914256} {"current_steps": 32045, "total_steps": 33920, "loss": 0.2981, "lr": 9.288795928596661e-08, "epoch": 18.89445754716981, "percentage": 94.47, "elapsed_time": "1:01:49", "remaining_time": "0:03:37", "throughput": 5638.28, "total_tokens": 20917904} {"current_steps": 32050, "total_steps": 33920, "loss": 0.2732, "lr": 9.239500932793854e-08, "epoch": 18.89740566037736, "percentage": 94.49, "elapsed_time": "1:01:50", "remaining_time": "0:03:36", "throughput": 5638.48, "total_tokens": 20922288} {"current_steps": 32055, "total_steps": 33920, "loss": 0.4326, "lr": 9.190335867948263e-08, "epoch": 18.900353773584907, "percentage": 94.5, "elapsed_time": "1:01:51", "remaining_time": "0:03:35", "throughput": 5638.49, "total_tokens": 20925328} {"current_steps": 32060, "total_steps": 33920, "loss": 0.4076, "lr": 9.141300747076476e-08, "epoch": 18.903301886792452, "percentage": 94.52, "elapsed_time": "1:01:51", "remaining_time": "0:03:35", "throughput": 5638.55, "total_tokens": 20928432} {"current_steps": 32065, "total_steps": 33920, "loss": 0.2425, "lr": 9.092395583160773e-08, "epoch": 18.90625, "percentage": 94.53, "elapsed_time": "1:01:52", "remaining_time": "0:03:34", "throughput": 5638.66, "total_tokens": 20932496} {"current_steps": 32070, "total_steps": 33920, "loss": 0.1986, "lr": 9.043620389149021e-08, "epoch": 18.909198113207548, "percentage": 94.55, "elapsed_time": "1:01:52", "remaining_time": "0:03:34", "throughput": 5638.64, "total_tokens": 20935184} {"current_steps": 32075, "total_steps": 33920, "loss": 0.3418, "lr": 8.994975177954723e-08, "epoch": 18.912146226415093, "percentage": 94.56, "elapsed_time": "1:01:53", "remaining_time": "0:03:33", "throughput": 5638.7, "total_tokens": 20938288} {"current_steps": 32080, "total_steps": 33920, "loss": 0.3366, "lr": 8.946459962456855e-08, "epoch": 18.91509433962264, "percentage": 94.58, "elapsed_time": "1:01:53", "remaining_time": "0:03:33", "throughput": 5638.77, "total_tokens": 20941648} {"current_steps": 32085, "total_steps": 33920, "loss": 0.3754, "lr": 8.89807475550003e-08, "epoch": 18.91804245283019, "percentage": 94.59, "elapsed_time": "1:01:54", "remaining_time": "0:03:32", "throughput": 5638.88, "total_tokens": 20945008} {"current_steps": 32090, "total_steps": 33920, "loss": 0.3541, "lr": 8.849819569894447e-08, "epoch": 18.920990566037737, "percentage": 94.6, "elapsed_time": "1:01:54", "remaining_time": "0:03:31", "throughput": 5638.88, "total_tokens": 20947792} {"current_steps": 32095, "total_steps": 33920, "loss": 0.2469, "lr": 8.801694418415884e-08, "epoch": 18.923938679245282, "percentage": 94.62, "elapsed_time": "1:01:55", "remaining_time": "0:03:31", "throughput": 5638.87, "total_tokens": 20950576} {"current_steps": 32100, "total_steps": 33920, "loss": 0.3381, "lr": 8.753699313805708e-08, "epoch": 18.92688679245283, "percentage": 94.63, "elapsed_time": "1:01:55", "remaining_time": "0:03:30", "throughput": 5638.92, "total_tokens": 20953840} {"current_steps": 32105, "total_steps": 33920, "loss": 0.2294, "lr": 8.705834268770753e-08, "epoch": 18.92983490566038, "percentage": 94.65, "elapsed_time": "1:01:56", "remaining_time": "0:03:30", "throughput": 5638.9, "total_tokens": 20956592} {"current_steps": 32110, "total_steps": 33920, "loss": 0.3171, "lr": 8.65809929598349e-08, "epoch": 18.932783018867923, "percentage": 94.66, "elapsed_time": "1:01:56", "remaining_time": "0:03:29", "throughput": 5638.83, "total_tokens": 20959088} {"current_steps": 32115, "total_steps": 33920, "loss": 0.2669, "lr": 8.610494408082037e-08, "epoch": 18.93573113207547, "percentage": 94.68, "elapsed_time": "1:01:57", "remaining_time": "0:03:28", "throughput": 5638.93, "total_tokens": 20962576} {"current_steps": 32120, "total_steps": 33920, "loss": 0.2132, "lr": 8.563019617669977e-08, "epoch": 18.93867924528302, "percentage": 94.69, "elapsed_time": "1:01:58", "remaining_time": "0:03:28", "throughput": 5639.07, "total_tokens": 20966896} {"current_steps": 32125, "total_steps": 33920, "loss": 0.3379, "lr": 8.51567493731642e-08, "epoch": 18.941627358490567, "percentage": 94.71, "elapsed_time": "1:01:58", "remaining_time": "0:03:27", "throughput": 5639.13, "total_tokens": 20970608} {"current_steps": 32130, "total_steps": 33920, "loss": 0.2447, "lr": 8.468460379556176e-08, "epoch": 18.944575471698112, "percentage": 94.72, "elapsed_time": "1:01:59", "remaining_time": "0:03:27", "throughput": 5639.13, "total_tokens": 20973616} {"current_steps": 32135, "total_steps": 33920, "loss": 0.3532, "lr": 8.421375956889355e-08, "epoch": 18.94752358490566, "percentage": 94.74, "elapsed_time": "1:01:59", "remaining_time": "0:03:26", "throughput": 5639.09, "total_tokens": 20976272} {"current_steps": 32140, "total_steps": 33920, "loss": 0.2378, "lr": 8.374421681781819e-08, "epoch": 18.95047169811321, "percentage": 94.75, "elapsed_time": "1:02:00", "remaining_time": "0:03:26", "throughput": 5639.1, "total_tokens": 20979248} {"current_steps": 32145, "total_steps": 33920, "loss": 0.4016, "lr": 8.327597566665013e-08, "epoch": 18.953419811320753, "percentage": 94.77, "elapsed_time": "1:02:00", "remaining_time": "0:03:25", "throughput": 5639.09, "total_tokens": 20982448} {"current_steps": 32150, "total_steps": 33920, "loss": 0.4091, "lr": 8.280903623935688e-08, "epoch": 18.9563679245283, "percentage": 94.78, "elapsed_time": "1:02:01", "remaining_time": "0:03:24", "throughput": 5639.31, "total_tokens": 20987120} {"current_steps": 32155, "total_steps": 33920, "loss": 0.2368, "lr": 8.234339865956342e-08, "epoch": 18.95931603773585, "percentage": 94.8, "elapsed_time": "1:02:02", "remaining_time": "0:03:24", "throughput": 5639.29, "total_tokens": 20990192} {"current_steps": 32160, "total_steps": 33920, "loss": 0.2239, "lr": 8.187906305054838e-08, "epoch": 18.962264150943398, "percentage": 94.81, "elapsed_time": "1:02:02", "remaining_time": "0:03:23", "throughput": 5639.29, "total_tokens": 20993264} {"current_steps": 32165, "total_steps": 33920, "loss": 0.2199, "lr": 8.141602953524841e-08, "epoch": 18.965212264150942, "percentage": 94.83, "elapsed_time": "1:02:03", "remaining_time": "0:03:23", "throughput": 5639.21, "total_tokens": 20995984} {"current_steps": 32170, "total_steps": 33920, "loss": 0.3432, "lr": 8.095429823625212e-08, "epoch": 18.96816037735849, "percentage": 94.84, "elapsed_time": "1:02:03", "remaining_time": "0:03:22", "throughput": 5639.14, "total_tokens": 20998672} {"current_steps": 32175, "total_steps": 33920, "loss": 0.2767, "lr": 8.04938692758045e-08, "epoch": 18.97110849056604, "percentage": 94.86, "elapsed_time": "1:02:04", "remaining_time": "0:03:21", "throughput": 5639.28, "total_tokens": 21002256} {"current_steps": 32180, "total_steps": 33920, "loss": 0.344, "lr": 8.003474277580803e-08, "epoch": 18.974056603773583, "percentage": 94.87, "elapsed_time": "1:02:04", "remaining_time": "0:03:21", "throughput": 5639.33, "total_tokens": 21005616} {"current_steps": 32185, "total_steps": 33920, "loss": 0.3489, "lr": 7.95769188578166e-08, "epoch": 18.97700471698113, "percentage": 94.89, "elapsed_time": "1:02:05", "remaining_time": "0:03:20", "throughput": 5639.41, "total_tokens": 21008976} {"current_steps": 32190, "total_steps": 33920, "loss": 0.4761, "lr": 7.912039764304213e-08, "epoch": 18.97995283018868, "percentage": 94.9, "elapsed_time": "1:02:05", "remaining_time": "0:03:20", "throughput": 5639.37, "total_tokens": 21011728} {"current_steps": 32195, "total_steps": 33920, "loss": 0.3162, "lr": 7.866517925235017e-08, "epoch": 18.982900943396228, "percentage": 94.91, "elapsed_time": "1:02:06", "remaining_time": "0:03:19", "throughput": 5639.49, "total_tokens": 21015312} {"current_steps": 32200, "total_steps": 33920, "loss": 0.2954, "lr": 7.821126380626154e-08, "epoch": 18.985849056603772, "percentage": 94.93, "elapsed_time": "1:02:06", "remaining_time": "0:03:19", "throughput": 5639.53, "total_tokens": 21018160} {"current_steps": 32205, "total_steps": 33920, "loss": 0.2075, "lr": 7.775865142495286e-08, "epoch": 18.98879716981132, "percentage": 94.94, "elapsed_time": "1:02:07", "remaining_time": "0:03:18", "throughput": 5639.54, "total_tokens": 21020976} {"current_steps": 32210, "total_steps": 33920, "loss": 0.3183, "lr": 7.730734222825442e-08, "epoch": 18.99174528301887, "percentage": 94.96, "elapsed_time": "1:02:07", "remaining_time": "0:03:17", "throughput": 5639.59, "total_tokens": 21024240} {"current_steps": 32215, "total_steps": 33920, "loss": 0.1867, "lr": 7.68573363356534e-08, "epoch": 18.994693396226417, "percentage": 94.97, "elapsed_time": "1:02:08", "remaining_time": "0:03:17", "throughput": 5639.77, "total_tokens": 21028400} {"current_steps": 32220, "total_steps": 33920, "loss": 0.2273, "lr": 7.640863386629005e-08, "epoch": 18.99764150943396, "percentage": 94.99, "elapsed_time": "1:02:09", "remaining_time": "0:03:16", "throughput": 5639.77, "total_tokens": 21032048} {"current_steps": 32225, "total_steps": 33920, "loss": 0.3804, "lr": 7.59612349389599e-08, "epoch": 19.00058962264151, "percentage": 95.0, "elapsed_time": "1:02:10", "remaining_time": "0:03:16", "throughput": 5639.24, "total_tokens": 21034792} {"current_steps": 32230, "total_steps": 33920, "loss": 0.356, "lr": 7.551513967211433e-08, "epoch": 19.003537735849058, "percentage": 95.02, "elapsed_time": "1:02:10", "remaining_time": "0:03:15", "throughput": 5639.26, "total_tokens": 21037768} {"current_steps": 32235, "total_steps": 33920, "loss": 0.2647, "lr": 7.507034818385883e-08, "epoch": 19.006485849056602, "percentage": 95.03, "elapsed_time": "1:02:11", "remaining_time": "0:03:15", "throughput": 5639.12, "total_tokens": 21040552} {"current_steps": 32240, "total_steps": 33920, "loss": 0.2797, "lr": 7.462686059195423e-08, "epoch": 19.00943396226415, "percentage": 95.05, "elapsed_time": "1:02:11", "remaining_time": "0:03:14", "throughput": 5639.09, "total_tokens": 21043368} {"current_steps": 32245, "total_steps": 33920, "loss": 0.3193, "lr": 7.418467701381548e-08, "epoch": 19.0123820754717, "percentage": 95.06, "elapsed_time": "1:02:12", "remaining_time": "0:03:13", "throughput": 5638.99, "total_tokens": 21045928} {"current_steps": 32250, "total_steps": 33920, "loss": 0.2731, "lr": 7.374379756651285e-08, "epoch": 19.015330188679247, "percentage": 95.08, "elapsed_time": "1:02:12", "remaining_time": "0:03:13", "throughput": 5638.9, "total_tokens": 21048616} {"current_steps": 32255, "total_steps": 33920, "loss": 0.2961, "lr": 7.330422236677015e-08, "epoch": 19.01827830188679, "percentage": 95.09, "elapsed_time": "1:02:13", "remaining_time": "0:03:12", "throughput": 5638.87, "total_tokens": 21051304} {"current_steps": 32260, "total_steps": 33920, "loss": 0.4085, "lr": 7.286595153096765e-08, "epoch": 19.02122641509434, "percentage": 95.11, "elapsed_time": "1:02:13", "remaining_time": "0:03:12", "throughput": 5638.95, "total_tokens": 21054856} {"current_steps": 32265, "total_steps": 33920, "loss": 0.3108, "lr": 7.242898517513864e-08, "epoch": 19.024174528301888, "percentage": 95.12, "elapsed_time": "1:02:14", "remaining_time": "0:03:11", "throughput": 5638.99, "total_tokens": 21057832} {"current_steps": 32270, "total_steps": 33920, "loss": 0.2392, "lr": 7.199332341497333e-08, "epoch": 19.027122641509433, "percentage": 95.14, "elapsed_time": "1:02:14", "remaining_time": "0:03:10", "throughput": 5639.03, "total_tokens": 21060968} {"current_steps": 32275, "total_steps": 33920, "loss": 0.2418, "lr": 7.155896636581394e-08, "epoch": 19.03007075471698, "percentage": 95.15, "elapsed_time": "1:02:15", "remaining_time": "0:03:10", "throughput": 5639.04, "total_tokens": 21064232} {"current_steps": 32280, "total_steps": 33920, "loss": 0.2453, "lr": 7.112591414265901e-08, "epoch": 19.03301886792453, "percentage": 95.17, "elapsed_time": "1:02:15", "remaining_time": "0:03:09", "throughput": 5638.94, "total_tokens": 21066792} {"current_steps": 32285, "total_steps": 33920, "loss": 0.4086, "lr": 7.069416686016018e-08, "epoch": 19.035966981132077, "percentage": 95.18, "elapsed_time": "1:02:16", "remaining_time": "0:03:09", "throughput": 5638.86, "total_tokens": 21069288} {"current_steps": 32290, "total_steps": 33920, "loss": 0.2938, "lr": 7.026372463262488e-08, "epoch": 19.03891509433962, "percentage": 95.19, "elapsed_time": "1:02:17", "remaining_time": "0:03:08", "throughput": 5639.01, "total_tokens": 21073544} {"current_steps": 32295, "total_steps": 33920, "loss": 0.307, "lr": 6.983458757401418e-08, "epoch": 19.04186320754717, "percentage": 95.21, "elapsed_time": "1:02:17", "remaining_time": "0:03:08", "throughput": 5639.09, "total_tokens": 21077096} {"current_steps": 32300, "total_steps": 33920, "loss": 0.3095, "lr": 6.940675579794443e-08, "epoch": 19.044811320754718, "percentage": 95.22, "elapsed_time": "1:02:18", "remaining_time": "0:03:07", "throughput": 5639.11, "total_tokens": 21080104} {"current_steps": 32305, "total_steps": 33920, "loss": 0.2692, "lr": 6.898022941768612e-08, "epoch": 19.047759433962263, "percentage": 95.24, "elapsed_time": "1:02:18", "remaining_time": "0:03:06", "throughput": 5639.19, "total_tokens": 21083304} {"current_steps": 32310, "total_steps": 33920, "loss": 0.3282, "lr": 6.855500854616337e-08, "epoch": 19.05070754716981, "percentage": 95.25, "elapsed_time": "1:02:19", "remaining_time": "0:03:06", "throughput": 5639.26, "total_tokens": 21086920} {"current_steps": 32315, "total_steps": 33920, "loss": 0.3242, "lr": 6.813109329595557e-08, "epoch": 19.05365566037736, "percentage": 95.27, "elapsed_time": "1:02:19", "remaining_time": "0:03:05", "throughput": 5639.36, "total_tokens": 21090952} {"current_steps": 32320, "total_steps": 33920, "loss": 0.3587, "lr": 6.770848377929573e-08, "epoch": 19.056603773584907, "percentage": 95.28, "elapsed_time": "1:02:20", "remaining_time": "0:03:05", "throughput": 5639.49, "total_tokens": 21095336} {"current_steps": 32325, "total_steps": 33920, "loss": 0.3279, "lr": 6.728718010807156e-08, "epoch": 19.059551886792452, "percentage": 95.3, "elapsed_time": "1:02:21", "remaining_time": "0:03:04", "throughput": 5639.46, "total_tokens": 21098120} {"current_steps": 32330, "total_steps": 33920, "loss": 0.2359, "lr": 6.68671823938255e-08, "epoch": 19.0625, "percentage": 95.31, "elapsed_time": "1:02:21", "remaining_time": "0:03:04", "throughput": 5639.46, "total_tokens": 21101096} {"current_steps": 32335, "total_steps": 33920, "loss": 0.3963, "lr": 6.644849074775361e-08, "epoch": 19.065448113207548, "percentage": 95.33, "elapsed_time": "1:02:22", "remaining_time": "0:03:03", "throughput": 5639.41, "total_tokens": 21104072} {"current_steps": 32340, "total_steps": 33920, "loss": 0.277, "lr": 6.603110528070667e-08, "epoch": 19.068396226415093, "percentage": 95.34, "elapsed_time": "1:02:22", "remaining_time": "0:03:02", "throughput": 5639.44, "total_tokens": 21107176} {"current_steps": 32345, "total_steps": 33920, "loss": 0.2613, "lr": 6.561502610318849e-08, "epoch": 19.07134433962264, "percentage": 95.36, "elapsed_time": "1:02:23", "remaining_time": "0:03:02", "throughput": 5639.44, "total_tokens": 21110056} {"current_steps": 32350, "total_steps": 33920, "loss": 0.2424, "lr": 6.520025332535762e-08, "epoch": 19.07429245283019, "percentage": 95.37, "elapsed_time": "1:02:23", "remaining_time": "0:03:01", "throughput": 5639.47, "total_tokens": 21113416} {"current_steps": 32355, "total_steps": 33920, "loss": 0.2071, "lr": 6.47867870570279e-08, "epoch": 19.077240566037737, "percentage": 95.39, "elapsed_time": "1:02:24", "remaining_time": "0:03:01", "throughput": 5639.52, "total_tokens": 21116648} {"current_steps": 32360, "total_steps": 33920, "loss": 0.2245, "lr": 6.437462740766564e-08, "epoch": 19.080188679245282, "percentage": 95.4, "elapsed_time": "1:02:24", "remaining_time": "0:03:00", "throughput": 5639.68, "total_tokens": 21120488} {"current_steps": 32365, "total_steps": 33920, "loss": 0.2974, "lr": 6.396377448639246e-08, "epoch": 19.08313679245283, "percentage": 95.42, "elapsed_time": "1:02:25", "remaining_time": "0:02:59", "throughput": 5639.71, "total_tokens": 21123688} {"current_steps": 32370, "total_steps": 33920, "loss": 0.2927, "lr": 6.3554228401983e-08, "epoch": 19.08608490566038, "percentage": 95.43, "elapsed_time": "1:02:26", "remaining_time": "0:02:59", "throughput": 5639.7, "total_tokens": 21126760} {"current_steps": 32375, "total_steps": 33920, "loss": 0.2894, "lr": 6.314598926286663e-08, "epoch": 19.089033018867923, "percentage": 95.45, "elapsed_time": "1:02:26", "remaining_time": "0:02:58", "throughput": 5639.53, "total_tokens": 21129224} {"current_steps": 32380, "total_steps": 33920, "loss": 0.2526, "lr": 6.273905717712637e-08, "epoch": 19.09198113207547, "percentage": 95.46, "elapsed_time": "1:02:27", "remaining_time": "0:02:58", "throughput": 5639.5, "total_tokens": 21132072} {"current_steps": 32385, "total_steps": 33920, "loss": 0.3588, "lr": 6.233343225249933e-08, "epoch": 19.09492924528302, "percentage": 95.47, "elapsed_time": "1:02:27", "remaining_time": "0:02:57", "throughput": 5639.55, "total_tokens": 21135592} {"current_steps": 32390, "total_steps": 33920, "loss": 0.4374, "lr": 6.192911459637519e-08, "epoch": 19.097877358490567, "percentage": 95.49, "elapsed_time": "1:02:28", "remaining_time": "0:02:57", "throughput": 5639.63, "total_tokens": 21138824} {"current_steps": 32395, "total_steps": 33920, "loss": 0.2376, "lr": 6.152610431580052e-08, "epoch": 19.100825471698112, "percentage": 95.5, "elapsed_time": "1:02:28", "remaining_time": "0:02:56", "throughput": 5639.68, "total_tokens": 21141896} {"current_steps": 32400, "total_steps": 33920, "loss": 0.2266, "lr": 6.112440151747389e-08, "epoch": 19.10377358490566, "percentage": 95.52, "elapsed_time": "1:02:29", "remaining_time": "0:02:55", "throughput": 5639.8, "total_tokens": 21145448} {"current_steps": 32405, "total_steps": 33920, "loss": 0.3065, "lr": 6.072400630774689e-08, "epoch": 19.10672169811321, "percentage": 95.53, "elapsed_time": "1:02:29", "remaining_time": "0:02:55", "throughput": 5639.87, "total_tokens": 21148616} {"current_steps": 32410, "total_steps": 33920, "loss": 0.3904, "lr": 6.032491879262637e-08, "epoch": 19.109669811320753, "percentage": 95.55, "elapsed_time": "1:02:30", "remaining_time": "0:02:54", "throughput": 5639.88, "total_tokens": 21151816} {"current_steps": 32415, "total_steps": 33920, "loss": 0.2691, "lr": 5.99271390777717e-08, "epoch": 19.1126179245283, "percentage": 95.56, "elapsed_time": "1:02:31", "remaining_time": "0:02:54", "throughput": 5639.98, "total_tokens": 21155656} {"current_steps": 32420, "total_steps": 33920, "loss": 0.2806, "lr": 5.953066726849865e-08, "epoch": 19.11556603773585, "percentage": 95.58, "elapsed_time": "1:02:31", "remaining_time": "0:02:53", "throughput": 5640.05, "total_tokens": 21159144} {"current_steps": 32425, "total_steps": 33920, "loss": 0.2503, "lr": 5.913550346977326e-08, "epoch": 19.118514150943398, "percentage": 95.59, "elapsed_time": "1:02:32", "remaining_time": "0:02:53", "throughput": 5640.25, "total_tokens": 21164616} {"current_steps": 32430, "total_steps": 33920, "loss": 0.4119, "lr": 5.874164778621683e-08, "epoch": 19.121462264150942, "percentage": 95.61, "elapsed_time": "1:02:32", "remaining_time": "0:02:52", "throughput": 5640.18, "total_tokens": 21167176} {"current_steps": 32435, "total_steps": 33920, "loss": 0.3008, "lr": 5.834910032210539e-08, "epoch": 19.12441037735849, "percentage": 95.62, "elapsed_time": "1:02:33", "remaining_time": "0:02:51", "throughput": 5640.12, "total_tokens": 21169736} {"current_steps": 32440, "total_steps": 33920, "loss": 0.361, "lr": 5.795786118136693e-08, "epoch": 19.12735849056604, "percentage": 95.64, "elapsed_time": "1:02:33", "remaining_time": "0:02:51", "throughput": 5640.11, "total_tokens": 21172520} {"current_steps": 32445, "total_steps": 33920, "loss": 0.3234, "lr": 5.756793046758302e-08, "epoch": 19.130306603773583, "percentage": 95.65, "elapsed_time": "1:02:34", "remaining_time": "0:02:50", "throughput": 5640.02, "total_tokens": 21175048} {"current_steps": 32450, "total_steps": 33920, "loss": 0.3188, "lr": 5.7179308283990544e-08, "epoch": 19.13325471698113, "percentage": 95.67, "elapsed_time": "1:02:34", "remaining_time": "0:02:50", "throughput": 5639.95, "total_tokens": 21177672} {"current_steps": 32455, "total_steps": 33920, "loss": 0.3806, "lr": 5.679199473347885e-08, "epoch": 19.13620283018868, "percentage": 95.68, "elapsed_time": "1:02:35", "remaining_time": "0:02:49", "throughput": 5639.93, "total_tokens": 21180712} {"current_steps": 32460, "total_steps": 33920, "loss": 0.4888, "lr": 5.6405989918590366e-08, "epoch": 19.139150943396228, "percentage": 95.7, "elapsed_time": "1:02:36", "remaining_time": "0:02:48", "throughput": 5639.97, "total_tokens": 21184872} {"current_steps": 32465, "total_steps": 33920, "loss": 0.3319, "lr": 5.6021293941522225e-08, "epoch": 19.142099056603772, "percentage": 95.71, "elapsed_time": "1:02:36", "remaining_time": "0:02:48", "throughput": 5639.94, "total_tokens": 21187784} {"current_steps": 32470, "total_steps": 33920, "loss": 0.2975, "lr": 5.563790690412352e-08, "epoch": 19.14504716981132, "percentage": 95.73, "elapsed_time": "1:02:37", "remaining_time": "0:02:47", "throughput": 5640.1, "total_tokens": 21191656} {"current_steps": 32475, "total_steps": 33920, "loss": 0.2556, "lr": 5.525582890789805e-08, "epoch": 19.14799528301887, "percentage": 95.74, "elapsed_time": "1:02:37", "remaining_time": "0:02:47", "throughput": 5640.14, "total_tokens": 21194792} {"current_steps": 32480, "total_steps": 33920, "loss": 0.3273, "lr": 5.4875060054002115e-08, "epoch": 19.150943396226417, "percentage": 95.75, "elapsed_time": "1:02:38", "remaining_time": "0:02:46", "throughput": 5640.14, "total_tokens": 21197640} {"current_steps": 32485, "total_steps": 33920, "loss": 0.3259, "lr": 5.4495600443246755e-08, "epoch": 19.15389150943396, "percentage": 95.77, "elapsed_time": "1:02:39", "remaining_time": "0:02:46", "throughput": 5640.29, "total_tokens": 21202056} {"current_steps": 32490, "total_steps": 33920, "loss": 0.4404, "lr": 5.411745017609493e-08, "epoch": 19.15683962264151, "percentage": 95.78, "elapsed_time": "1:02:39", "remaining_time": "0:02:45", "throughput": 5640.37, "total_tokens": 21205192} {"current_steps": 32495, "total_steps": 33920, "loss": 0.1705, "lr": 5.374060935266434e-08, "epoch": 19.159787735849058, "percentage": 95.8, "elapsed_time": "1:02:40", "remaining_time": "0:02:44", "throughput": 5640.32, "total_tokens": 21207880} {"current_steps": 32500, "total_steps": 33920, "loss": 0.2481, "lr": 5.3365078072724065e-08, "epoch": 19.162735849056602, "percentage": 95.81, "elapsed_time": "1:02:40", "remaining_time": "0:02:44", "throughput": 5640.4, "total_tokens": 21211112} {"current_steps": 32505, "total_steps": 33920, "loss": 0.306, "lr": 5.299085643569846e-08, "epoch": 19.16568396226415, "percentage": 95.83, "elapsed_time": "1:02:41", "remaining_time": "0:02:43", "throughput": 5640.42, "total_tokens": 21214184} {"current_steps": 32510, "total_steps": 33920, "loss": 0.4544, "lr": 5.261794454066327e-08, "epoch": 19.1686320754717, "percentage": 95.84, "elapsed_time": "1:02:41", "remaining_time": "0:02:43", "throughput": 5640.4, "total_tokens": 21217128} {"current_steps": 32515, "total_steps": 33920, "loss": 0.2095, "lr": 5.224634248635008e-08, "epoch": 19.171580188679247, "percentage": 95.86, "elapsed_time": "1:02:42", "remaining_time": "0:02:42", "throughput": 5640.44, "total_tokens": 21220616} {"current_steps": 32520, "total_steps": 33920, "loss": 0.2812, "lr": 5.187605037114129e-08, "epoch": 19.17452830188679, "percentage": 95.87, "elapsed_time": "1:02:42", "remaining_time": "0:02:41", "throughput": 5640.5, "total_tokens": 21224168} {"current_steps": 32525, "total_steps": 33920, "loss": 0.3054, "lr": 5.15070682930735e-08, "epoch": 19.17747641509434, "percentage": 95.89, "elapsed_time": "1:02:43", "remaining_time": "0:02:41", "throughput": 5640.66, "total_tokens": 21227944} {"current_steps": 32530, "total_steps": 33920, "loss": 0.3258, "lr": 5.113939634983578e-08, "epoch": 19.180424528301888, "percentage": 95.9, "elapsed_time": "1:02:43", "remaining_time": "0:02:40", "throughput": 5640.52, "total_tokens": 21230184} {"current_steps": 32535, "total_steps": 33920, "loss": 0.266, "lr": 5.077303463877192e-08, "epoch": 19.183372641509433, "percentage": 95.92, "elapsed_time": "1:02:44", "remaining_time": "0:02:40", "throughput": 5640.54, "total_tokens": 21233768} {"current_steps": 32540, "total_steps": 33920, "loss": 0.4034, "lr": 5.040798325687601e-08, "epoch": 19.18632075471698, "percentage": 95.93, "elapsed_time": "1:02:45", "remaining_time": "0:02:39", "throughput": 5640.66, "total_tokens": 21237224} {"current_steps": 32545, "total_steps": 33920, "loss": 0.2871, "lr": 5.004424230079852e-08, "epoch": 19.18926886792453, "percentage": 95.95, "elapsed_time": "1:02:45", "remaining_time": "0:02:39", "throughput": 5640.63, "total_tokens": 21240392} {"current_steps": 32550, "total_steps": 33920, "loss": 0.2167, "lr": 4.968181186684129e-08, "epoch": 19.192216981132077, "percentage": 95.96, "elapsed_time": "1:02:46", "remaining_time": "0:02:38", "throughput": 5640.72, "total_tokens": 21243880} {"current_steps": 32555, "total_steps": 33920, "loss": 0.3156, "lr": 4.932069205095924e-08, "epoch": 19.19516509433962, "percentage": 95.98, "elapsed_time": "1:02:46", "remaining_time": "0:02:37", "throughput": 5640.86, "total_tokens": 21247592} {"current_steps": 32560, "total_steps": 33920, "loss": 0.3853, "lr": 4.896088294875978e-08, "epoch": 19.19811320754717, "percentage": 95.99, "elapsed_time": "1:02:47", "remaining_time": "0:02:37", "throughput": 5640.75, "total_tokens": 21250056} {"current_steps": 32565, "total_steps": 33920, "loss": 0.3021, "lr": 4.8602384655505044e-08, "epoch": 19.201061320754718, "percentage": 96.01, "elapsed_time": "1:02:47", "remaining_time": "0:02:36", "throughput": 5640.7, "total_tokens": 21252872} {"current_steps": 32570, "total_steps": 33920, "loss": 0.3121, "lr": 4.824519726610744e-08, "epoch": 19.204009433962263, "percentage": 96.02, "elapsed_time": "1:02:48", "remaining_time": "0:02:36", "throughput": 5640.87, "total_tokens": 21256904} {"current_steps": 32575, "total_steps": 33920, "loss": 0.2636, "lr": 4.7889320875135206e-08, "epoch": 19.20695754716981, "percentage": 96.03, "elapsed_time": "1:02:48", "remaining_time": "0:02:35", "throughput": 5640.82, "total_tokens": 21259848} {"current_steps": 32580, "total_steps": 33920, "loss": 0.3051, "lr": 4.753475557680742e-08, "epoch": 19.20990566037736, "percentage": 96.05, "elapsed_time": "1:02:49", "remaining_time": "0:02:35", "throughput": 5640.82, "total_tokens": 21262760} {"current_steps": 32585, "total_steps": 33920, "loss": 0.2632, "lr": 4.718150146499734e-08, "epoch": 19.212853773584907, "percentage": 96.06, "elapsed_time": "1:02:49", "remaining_time": "0:02:34", "throughput": 5640.85, "total_tokens": 21265928} {"current_steps": 32590, "total_steps": 33920, "loss": 0.2068, "lr": 4.682955863323013e-08, "epoch": 19.215801886792452, "percentage": 96.08, "elapsed_time": "1:02:50", "remaining_time": "0:02:33", "throughput": 5640.75, "total_tokens": 21268936} {"current_steps": 32595, "total_steps": 33920, "loss": 0.2969, "lr": 4.6478927174684606e-08, "epoch": 19.21875, "percentage": 96.09, "elapsed_time": "1:02:51", "remaining_time": "0:02:33", "throughput": 5640.77, "total_tokens": 21271912} {"current_steps": 32600, "total_steps": 33920, "loss": 0.273, "lr": 4.612960718219095e-08, "epoch": 19.221698113207548, "percentage": 96.11, "elapsed_time": "1:02:51", "remaining_time": "0:02:32", "throughput": 5640.63, "total_tokens": 21274536} {"current_steps": 32605, "total_steps": 33920, "loss": 0.2829, "lr": 4.578159874823407e-08, "epoch": 19.224646226415093, "percentage": 96.12, "elapsed_time": "1:02:52", "remaining_time": "0:02:32", "throughput": 5640.77, "total_tokens": 21278792} {"current_steps": 32610, "total_steps": 33920, "loss": 0.2358, "lr": 4.5434901964950264e-08, "epoch": 19.22759433962264, "percentage": 96.14, "elapsed_time": "1:02:52", "remaining_time": "0:02:31", "throughput": 5640.72, "total_tokens": 21281544} {"current_steps": 32615, "total_steps": 33920, "loss": 0.4405, "lr": 4.508951692412944e-08, "epoch": 19.23054245283019, "percentage": 96.15, "elapsed_time": "1:02:53", "remaining_time": "0:02:30", "throughput": 5640.78, "total_tokens": 21284712} {"current_steps": 32620, "total_steps": 33920, "loss": 0.2929, "lr": 4.4745443717213455e-08, "epoch": 19.233490566037737, "percentage": 96.17, "elapsed_time": "1:02:53", "remaining_time": "0:02:30", "throughput": 5640.87, "total_tokens": 21288232} {"current_steps": 32625, "total_steps": 33920, "loss": 0.2574, "lr": 4.4402682435296666e-08, "epoch": 19.236438679245282, "percentage": 96.18, "elapsed_time": "1:02:54", "remaining_time": "0:02:29", "throughput": 5640.94, "total_tokens": 21292040} {"current_steps": 32630, "total_steps": 33920, "loss": 0.3215, "lr": 4.406123316912758e-08, "epoch": 19.23938679245283, "percentage": 96.2, "elapsed_time": "1:02:55", "remaining_time": "0:02:29", "throughput": 5641.06, "total_tokens": 21295528} {"current_steps": 32635, "total_steps": 33920, "loss": 0.1895, "lr": 4.372109600910612e-08, "epoch": 19.24233490566038, "percentage": 96.21, "elapsed_time": "1:02:55", "remaining_time": "0:02:28", "throughput": 5641.03, "total_tokens": 21298216} {"current_steps": 32640, "total_steps": 33920, "loss": 0.2654, "lr": 4.338227104528414e-08, "epoch": 19.245283018867923, "percentage": 96.23, "elapsed_time": "1:02:56", "remaining_time": "0:02:28", "throughput": 5641.08, "total_tokens": 21301352} {"current_steps": 32645, "total_steps": 33920, "loss": 0.4293, "lr": 4.304475836736821e-08, "epoch": 19.24823113207547, "percentage": 96.24, "elapsed_time": "1:02:56", "remaining_time": "0:02:27", "throughput": 5640.97, "total_tokens": 21303720} {"current_steps": 32650, "total_steps": 33920, "loss": 0.405, "lr": 4.27085580647163e-08, "epoch": 19.25117924528302, "percentage": 96.26, "elapsed_time": "1:02:57", "remaining_time": "0:02:26", "throughput": 5641.01, "total_tokens": 21306760} {"current_steps": 32655, "total_steps": 33920, "loss": 0.342, "lr": 4.237367022633776e-08, "epoch": 19.254127358490567, "percentage": 96.27, "elapsed_time": "1:02:57", "remaining_time": "0:02:26", "throughput": 5641.22, "total_tokens": 21311752} {"current_steps": 32660, "total_steps": 33920, "loss": 0.2638, "lr": 4.204009494089612e-08, "epoch": 19.257075471698112, "percentage": 96.29, "elapsed_time": "1:02:58", "remaining_time": "0:02:25", "throughput": 5641.18, "total_tokens": 21314696} {"current_steps": 32665, "total_steps": 33920, "loss": 0.2289, "lr": 4.170783229670739e-08, "epoch": 19.26002358490566, "percentage": 96.3, "elapsed_time": "1:02:58", "remaining_time": "0:02:25", "throughput": 5641.22, "total_tokens": 21317960} {"current_steps": 32670, "total_steps": 33920, "loss": 0.2801, "lr": 4.137688238173898e-08, "epoch": 19.26297169811321, "percentage": 96.31, "elapsed_time": "1:02:59", "remaining_time": "0:02:24", "throughput": 5641.27, "total_tokens": 21322024} {"current_steps": 32675, "total_steps": 33920, "loss": 0.2995, "lr": 4.104724528361137e-08, "epoch": 19.265919811320753, "percentage": 96.33, "elapsed_time": "1:03:00", "remaining_time": "0:02:24", "throughput": 5641.26, "total_tokens": 21325384} {"current_steps": 32680, "total_steps": 33920, "loss": 0.3396, "lr": 4.071892108959752e-08, "epoch": 19.2688679245283, "percentage": 96.34, "elapsed_time": "1:03:00", "remaining_time": "0:02:23", "throughput": 5641.33, "total_tokens": 21328680} {"current_steps": 32685, "total_steps": 33920, "loss": 0.2063, "lr": 4.039190988662234e-08, "epoch": 19.27181603773585, "percentage": 96.36, "elapsed_time": "1:03:01", "remaining_time": "0:02:22", "throughput": 5641.3, "total_tokens": 21331432} {"current_steps": 32690, "total_steps": 33920, "loss": 0.2236, "lr": 4.006621176126435e-08, "epoch": 19.274764150943398, "percentage": 96.37, "elapsed_time": "1:03:01", "remaining_time": "0:02:22", "throughput": 5641.37, "total_tokens": 21334728} {"current_steps": 32695, "total_steps": 33920, "loss": 0.3599, "lr": 3.974182679975236e-08, "epoch": 19.277712264150942, "percentage": 96.39, "elapsed_time": "1:03:02", "remaining_time": "0:02:21", "throughput": 5641.42, "total_tokens": 21338376} {"current_steps": 32700, "total_steps": 33920, "loss": 0.2961, "lr": 3.941875508796933e-08, "epoch": 19.28066037735849, "percentage": 96.4, "elapsed_time": "1:03:02", "remaining_time": "0:02:21", "throughput": 5641.35, "total_tokens": 21341032} {"current_steps": 32705, "total_steps": 33920, "loss": 0.281, "lr": 3.909699671145017e-08, "epoch": 19.28360849056604, "percentage": 96.42, "elapsed_time": "1:03:03", "remaining_time": "0:02:20", "throughput": 5641.38, "total_tokens": 21344264} {"current_steps": 32710, "total_steps": 33920, "loss": 0.3551, "lr": 3.87765517553812e-08, "epoch": 19.286556603773583, "percentage": 96.43, "elapsed_time": "1:03:04", "remaining_time": "0:02:19", "throughput": 5641.35, "total_tokens": 21346920} {"current_steps": 32715, "total_steps": 33920, "loss": 0.3673, "lr": 3.8457420304601756e-08, "epoch": 19.28950471698113, "percentage": 96.45, "elapsed_time": "1:03:04", "remaining_time": "0:02:19", "throughput": 5641.37, "total_tokens": 21349896} {"current_steps": 32720, "total_steps": 33920, "loss": 0.2812, "lr": 3.813960244360371e-08, "epoch": 19.29245283018868, "percentage": 96.46, "elapsed_time": "1:03:05", "remaining_time": "0:02:18", "throughput": 5641.33, "total_tokens": 21352808} {"current_steps": 32725, "total_steps": 33920, "loss": 0.3668, "lr": 3.7823098256529744e-08, "epoch": 19.295400943396228, "percentage": 96.48, "elapsed_time": "1:03:05", "remaining_time": "0:02:18", "throughput": 5641.35, "total_tokens": 21356136} {"current_steps": 32730, "total_steps": 33920, "loss": 0.3403, "lr": 3.750790782717673e-08, "epoch": 19.298349056603772, "percentage": 96.49, "elapsed_time": "1:03:06", "remaining_time": "0:02:17", "throughput": 5641.54, "total_tokens": 21360808} {"current_steps": 32735, "total_steps": 33920, "loss": 0.2883, "lr": 3.719403123899179e-08, "epoch": 19.30129716981132, "percentage": 96.51, "elapsed_time": "1:03:06", "remaining_time": "0:02:17", "throughput": 5641.52, "total_tokens": 21363464} {"current_steps": 32740, "total_steps": 33920, "loss": 0.2235, "lr": 3.688146857507624e-08, "epoch": 19.30424528301887, "percentage": 96.52, "elapsed_time": "1:03:07", "remaining_time": "0:02:16", "throughput": 5641.71, "total_tokens": 21368104} {"current_steps": 32745, "total_steps": 33920, "loss": 0.4012, "lr": 3.657021991818166e-08, "epoch": 19.307193396226417, "percentage": 96.54, "elapsed_time": "1:03:08", "remaining_time": "0:02:15", "throughput": 5641.63, "total_tokens": 21370824} {"current_steps": 32750, "total_steps": 33920, "loss": 0.2299, "lr": 3.626028535071213e-08, "epoch": 19.31014150943396, "percentage": 96.55, "elapsed_time": "1:03:08", "remaining_time": "0:02:15", "throughput": 5641.6, "total_tokens": 21373512} {"current_steps": 32755, "total_steps": 33920, "loss": 0.2486, "lr": 3.59516649547248e-08, "epoch": 19.31308962264151, "percentage": 96.57, "elapsed_time": "1:03:09", "remaining_time": "0:02:14", "throughput": 5641.64, "total_tokens": 21376552} {"current_steps": 32760, "total_steps": 33920, "loss": 0.2959, "lr": 3.564435881192818e-08, "epoch": 19.316037735849058, "percentage": 96.58, "elapsed_time": "1:03:09", "remaining_time": "0:02:14", "throughput": 5641.57, "total_tokens": 21379368} {"current_steps": 32765, "total_steps": 33920, "loss": 0.2732, "lr": 3.5338367003682763e-08, "epoch": 19.318985849056602, "percentage": 96.59, "elapsed_time": "1:03:10", "remaining_time": "0:02:13", "throughput": 5641.59, "total_tokens": 21382888} {"current_steps": 32770, "total_steps": 33920, "loss": 0.2127, "lr": 3.5033689611000954e-08, "epoch": 19.32193396226415, "percentage": 96.61, "elapsed_time": "1:03:10", "remaining_time": "0:02:13", "throughput": 5641.54, "total_tokens": 21385768} {"current_steps": 32775, "total_steps": 33920, "loss": 0.4212, "lr": 3.473032671454768e-08, "epoch": 19.3248820754717, "percentage": 96.62, "elapsed_time": "1:03:11", "remaining_time": "0:02:12", "throughput": 5641.57, "total_tokens": 21388904} {"current_steps": 32780, "total_steps": 33920, "loss": 0.2825, "lr": 3.44282783946398e-08, "epoch": 19.327830188679247, "percentage": 96.64, "elapsed_time": "1:03:11", "remaining_time": "0:02:11", "throughput": 5641.48, "total_tokens": 21391624} {"current_steps": 32785, "total_steps": 33920, "loss": 0.3603, "lr": 3.4127544731245575e-08, "epoch": 19.33077830188679, "percentage": 96.65, "elapsed_time": "1:03:12", "remaining_time": "0:02:11", "throughput": 5641.61, "total_tokens": 21395912} {"current_steps": 32790, "total_steps": 33920, "loss": 0.1849, "lr": 3.38281258039852e-08, "epoch": 19.33372641509434, "percentage": 96.67, "elapsed_time": "1:03:13", "remaining_time": "0:02:10", "throughput": 5641.68, "total_tokens": 21399496} {"current_steps": 32795, "total_steps": 33920, "loss": 0.303, "lr": 3.353002169213193e-08, "epoch": 19.336674528301888, "percentage": 96.68, "elapsed_time": "1:03:13", "remaining_time": "0:02:10", "throughput": 5641.61, "total_tokens": 21402088} {"current_steps": 32800, "total_steps": 33920, "loss": 0.4208, "lr": 3.32332324746093e-08, "epoch": 19.339622641509433, "percentage": 96.7, "elapsed_time": "1:03:14", "remaining_time": "0:02:09", "throughput": 5641.56, "total_tokens": 21404936} {"current_steps": 32805, "total_steps": 33920, "loss": 0.3071, "lr": 3.2937758229994455e-08, "epoch": 19.34257075471698, "percentage": 96.71, "elapsed_time": "1:03:14", "remaining_time": "0:02:08", "throughput": 5641.67, "total_tokens": 21408680} {"current_steps": 32810, "total_steps": 33920, "loss": 0.2711, "lr": 3.2643599036514815e-08, "epoch": 19.34551886792453, "percentage": 96.73, "elapsed_time": "1:03:15", "remaining_time": "0:02:08", "throughput": 5641.65, "total_tokens": 21412072} {"current_steps": 32815, "total_steps": 33920, "loss": 0.2704, "lr": 3.2350754972050316e-08, "epoch": 19.348466981132077, "percentage": 96.74, "elapsed_time": "1:03:15", "remaining_time": "0:02:07", "throughput": 5641.64, "total_tokens": 21415016} {"current_steps": 32820, "total_steps": 33920, "loss": 0.2713, "lr": 3.2059226114132815e-08, "epoch": 19.35141509433962, "percentage": 96.76, "elapsed_time": "1:03:16", "remaining_time": "0:02:07", "throughput": 5641.62, "total_tokens": 21417928} {"current_steps": 32825, "total_steps": 33920, "loss": 0.2296, "lr": 3.1769012539945575e-08, "epoch": 19.35436320754717, "percentage": 96.77, "elapsed_time": "1:03:16", "remaining_time": "0:02:06", "throughput": 5641.48, "total_tokens": 21420136} {"current_steps": 32830, "total_steps": 33920, "loss": 0.3328, "lr": 3.1480114326324364e-08, "epoch": 19.357311320754718, "percentage": 96.79, "elapsed_time": "1:03:17", "remaining_time": "0:02:06", "throughput": 5641.3, "total_tokens": 21422408} {"current_steps": 32835, "total_steps": 33920, "loss": 0.2794, "lr": 3.1192531549756325e-08, "epoch": 19.360259433962263, "percentage": 96.8, "elapsed_time": "1:03:17", "remaining_time": "0:02:05", "throughput": 5641.28, "total_tokens": 21425352} {"current_steps": 32840, "total_steps": 33920, "loss": 0.4428, "lr": 3.090626428638e-08, "epoch": 19.36320754716981, "percentage": 96.82, "elapsed_time": "1:03:18", "remaining_time": "0:02:04", "throughput": 5641.3, "total_tokens": 21428392} {"current_steps": 32845, "total_steps": 33920, "loss": 0.33, "lr": 3.062131261198531e-08, "epoch": 19.36615566037736, "percentage": 96.83, "elapsed_time": "1:03:19", "remaining_time": "0:02:04", "throughput": 5641.28, "total_tokens": 21431272} {"current_steps": 32850, "total_steps": 33920, "loss": 0.3193, "lr": 3.033767660201525e-08, "epoch": 19.369103773584907, "percentage": 96.85, "elapsed_time": "1:03:19", "remaining_time": "0:02:03", "throughput": 5641.27, "total_tokens": 21434248} {"current_steps": 32855, "total_steps": 33920, "loss": 0.1988, "lr": 3.005535633156309e-08, "epoch": 19.372051886792452, "percentage": 96.86, "elapsed_time": "1:03:20", "remaining_time": "0:02:03", "throughput": 5641.29, "total_tokens": 21437320} {"current_steps": 32860, "total_steps": 33920, "loss": 0.2124, "lr": 2.977435187537514e-08, "epoch": 19.375, "percentage": 96.88, "elapsed_time": "1:03:20", "remaining_time": "0:02:02", "throughput": 5641.35, "total_tokens": 21440552} {"current_steps": 32865, "total_steps": 33920, "loss": 0.2473, "lr": 2.949466330784745e-08, "epoch": 19.377948113207548, "percentage": 96.89, "elapsed_time": "1:03:21", "remaining_time": "0:02:02", "throughput": 5641.52, "total_tokens": 21444488} {"current_steps": 32870, "total_steps": 33920, "loss": 0.3404, "lr": 2.921629070302967e-08, "epoch": 19.380896226415093, "percentage": 96.9, "elapsed_time": "1:03:21", "remaining_time": "0:02:01", "throughput": 5641.51, "total_tokens": 21447304} {"current_steps": 32875, "total_steps": 33920, "loss": 0.3005, "lr": 2.893923413462174e-08, "epoch": 19.38384433962264, "percentage": 96.92, "elapsed_time": "1:03:22", "remaining_time": "0:02:00", "throughput": 5641.52, "total_tokens": 21450152} {"current_steps": 32880, "total_steps": 33920, "loss": 0.3742, "lr": 2.866349367597554e-08, "epoch": 19.38679245283019, "percentage": 96.93, "elapsed_time": "1:03:22", "remaining_time": "0:02:00", "throughput": 5641.41, "total_tokens": 21452744} {"current_steps": 32885, "total_steps": 33920, "loss": 0.3459, "lr": 2.8389069400094893e-08, "epoch": 19.389740566037737, "percentage": 96.95, "elapsed_time": "1:03:23", "remaining_time": "0:01:59", "throughput": 5641.58, "total_tokens": 21457224} {"current_steps": 32890, "total_steps": 33920, "loss": 0.2872, "lr": 2.811596137963446e-08, "epoch": 19.392688679245282, "percentage": 96.96, "elapsed_time": "1:03:23", "remaining_time": "0:01:59", "throughput": 5641.65, "total_tokens": 21460616} {"current_steps": 32895, "total_steps": 33920, "loss": 0.2755, "lr": 2.7844169686900844e-08, "epoch": 19.39563679245283, "percentage": 96.98, "elapsed_time": "1:03:24", "remaining_time": "0:01:58", "throughput": 5641.79, "total_tokens": 21464488} {"current_steps": 32900, "total_steps": 33920, "loss": 0.2681, "lr": 2.7573694393852047e-08, "epoch": 19.39858490566038, "percentage": 96.99, "elapsed_time": "1:03:25", "remaining_time": "0:01:57", "throughput": 5641.87, "total_tokens": 21467720} {"current_steps": 32905, "total_steps": 33920, "loss": 0.3072, "lr": 2.7304535572098e-08, "epoch": 19.401533018867923, "percentage": 97.01, "elapsed_time": "1:03:25", "remaining_time": "0:01:57", "throughput": 5641.86, "total_tokens": 21470600} {"current_steps": 32910, "total_steps": 33920, "loss": 0.253, "lr": 2.703669329289893e-08, "epoch": 19.40448113207547, "percentage": 97.02, "elapsed_time": "1:03:26", "remaining_time": "0:01:56", "throughput": 5641.86, "total_tokens": 21473992} {"current_steps": 32915, "total_steps": 33920, "loss": 0.4588, "lr": 2.6770167627167554e-08, "epoch": 19.40742924528302, "percentage": 97.04, "elapsed_time": "1:03:26", "remaining_time": "0:01:56", "throughput": 5641.96, "total_tokens": 21477672} {"current_steps": 32920, "total_steps": 33920, "loss": 0.3745, "lr": 2.6504958645467426e-08, "epoch": 19.410377358490567, "percentage": 97.05, "elapsed_time": "1:03:27", "remaining_time": "0:01:55", "throughput": 5641.97, "total_tokens": 21480648} {"current_steps": 32925, "total_steps": 33920, "loss": 0.2767, "lr": 2.6241066418014605e-08, "epoch": 19.413325471698112, "percentage": 97.07, "elapsed_time": "1:03:27", "remaining_time": "0:01:55", "throughput": 5641.84, "total_tokens": 21483208} {"current_steps": 32930, "total_steps": 33920, "loss": 0.1813, "lr": 2.5978491014674866e-08, "epoch": 19.41627358490566, "percentage": 97.08, "elapsed_time": "1:03:28", "remaining_time": "0:01:54", "throughput": 5641.9, "total_tokens": 21486504} {"current_steps": 32935, "total_steps": 33920, "loss": 0.2385, "lr": 2.571723250496705e-08, "epoch": 19.41922169811321, "percentage": 97.1, "elapsed_time": "1:03:28", "remaining_time": "0:01:53", "throughput": 5642.01, "total_tokens": 21490024} {"current_steps": 32940, "total_steps": 33920, "loss": 0.2529, "lr": 2.5457290958059155e-08, "epoch": 19.422169811320753, "percentage": 97.11, "elapsed_time": "1:03:29", "remaining_time": "0:01:53", "throughput": 5642.11, "total_tokens": 21493704} {"current_steps": 32945, "total_steps": 33920, "loss": 0.2939, "lr": 2.51986664427728e-08, "epoch": 19.4251179245283, "percentage": 97.13, "elapsed_time": "1:03:30", "remaining_time": "0:01:52", "throughput": 5642.15, "total_tokens": 21497448} {"current_steps": 32950, "total_steps": 33920, "loss": 0.474, "lr": 2.4941359027579883e-08, "epoch": 19.42806603773585, "percentage": 97.14, "elapsed_time": "1:03:30", "remaining_time": "0:01:52", "throughput": 5642.15, "total_tokens": 21500520} {"current_steps": 32955, "total_steps": 33920, "loss": 0.2568, "lr": 2.468536878060368e-08, "epoch": 19.431014150943398, "percentage": 97.16, "elapsed_time": "1:03:31", "remaining_time": "0:01:51", "throughput": 5642.23, "total_tokens": 21503784} {"current_steps": 32960, "total_steps": 33920, "loss": 0.3477, "lr": 2.443069576961832e-08, "epoch": 19.433962264150942, "percentage": 97.17, "elapsed_time": "1:03:31", "remaining_time": "0:01:51", "throughput": 5642.3, "total_tokens": 21507048} {"current_steps": 32965, "total_steps": 33920, "loss": 0.265, "lr": 2.4177340062049304e-08, "epoch": 19.43691037735849, "percentage": 97.18, "elapsed_time": "1:03:32", "remaining_time": "0:01:50", "throughput": 5642.21, "total_tokens": 21509512} {"current_steps": 32970, "total_steps": 33920, "loss": 0.3565, "lr": 2.3925301724974647e-08, "epoch": 19.43985849056604, "percentage": 97.2, "elapsed_time": "1:03:32", "remaining_time": "0:01:49", "throughput": 5642.13, "total_tokens": 21512232} {"current_steps": 32975, "total_steps": 33920, "loss": 0.2231, "lr": 2.367458082512153e-08, "epoch": 19.442806603773583, "percentage": 97.21, "elapsed_time": "1:03:33", "remaining_time": "0:01:49", "throughput": 5642.12, "total_tokens": 21515464} {"current_steps": 32980, "total_steps": 33920, "loss": 0.2759, "lr": 2.3425177428870737e-08, "epoch": 19.44575471698113, "percentage": 97.23, "elapsed_time": "1:03:33", "remaining_time": "0:01:48", "throughput": 5642.12, "total_tokens": 21518312} {"current_steps": 32985, "total_steps": 33920, "loss": 0.2931, "lr": 2.3177091602251677e-08, "epoch": 19.44870283018868, "percentage": 97.24, "elapsed_time": "1:03:34", "remaining_time": "0:01:48", "throughput": 5642.2, "total_tokens": 21521576} {"current_steps": 32990, "total_steps": 33920, "loss": 0.2695, "lr": 2.2930323410946254e-08, "epoch": 19.451650943396228, "percentage": 97.26, "elapsed_time": "1:03:35", "remaining_time": "0:01:47", "throughput": 5642.33, "total_tokens": 21525640} {"current_steps": 32995, "total_steps": 33920, "loss": 0.3224, "lr": 2.2684872920287758e-08, "epoch": 19.454599056603772, "percentage": 97.27, "elapsed_time": "1:03:35", "remaining_time": "0:01:46", "throughput": 5642.48, "total_tokens": 21529608} {"current_steps": 33000, "total_steps": 33920, "loss": 0.3279, "lr": 2.2440740195260323e-08, "epoch": 19.45754716981132, "percentage": 97.29, "elapsed_time": "1:03:36", "remaining_time": "0:01:46", "throughput": 5642.51, "total_tokens": 21532840} {"current_steps": 33005, "total_steps": 33920, "loss": 0.4382, "lr": 2.219792530049891e-08, "epoch": 19.46049528301887, "percentage": 97.3, "elapsed_time": "1:03:37", "remaining_time": "0:01:45", "throughput": 5642.65, "total_tokens": 21538696} {"current_steps": 33010, "total_steps": 33920, "loss": 0.2382, "lr": 2.1956428300290434e-08, "epoch": 19.463443396226417, "percentage": 97.32, "elapsed_time": "1:03:37", "remaining_time": "0:01:45", "throughput": 5642.69, "total_tokens": 21542216} {"current_steps": 33015, "total_steps": 33920, "loss": 0.3048, "lr": 2.1716249258570966e-08, "epoch": 19.46639150943396, "percentage": 97.33, "elapsed_time": "1:03:38", "remaining_time": "0:01:44", "throughput": 5642.62, "total_tokens": 21544808} {"current_steps": 33020, "total_steps": 33920, "loss": 0.2526, "lr": 2.1477388238930196e-08, "epoch": 19.46933962264151, "percentage": 97.35, "elapsed_time": "1:03:38", "remaining_time": "0:01:44", "throughput": 5642.69, "total_tokens": 21548552} {"current_steps": 33025, "total_steps": 33920, "loss": 0.3218, "lr": 2.1239845304606988e-08, "epoch": 19.472287735849058, "percentage": 97.36, "elapsed_time": "1:03:39", "remaining_time": "0:01:43", "throughput": 5642.64, "total_tokens": 21551272} {"current_steps": 33030, "total_steps": 33920, "loss": 0.3461, "lr": 2.100362051849214e-08, "epoch": 19.475235849056602, "percentage": 97.38, "elapsed_time": "1:03:39", "remaining_time": "0:01:42", "throughput": 5642.71, "total_tokens": 21554952} {"current_steps": 33035, "total_steps": 33920, "loss": 0.2865, "lr": 2.076871394312674e-08, "epoch": 19.47818396226415, "percentage": 97.39, "elapsed_time": "1:03:40", "remaining_time": "0:01:42", "throughput": 5642.81, "total_tokens": 21558952} {"current_steps": 33040, "total_steps": 33920, "loss": 0.3412, "lr": 2.0535125640703813e-08, "epoch": 19.4811320754717, "percentage": 97.41, "elapsed_time": "1:03:41", "remaining_time": "0:01:41", "throughput": 5642.78, "total_tokens": 21561800} {"current_steps": 33045, "total_steps": 33920, "loss": 0.2964, "lr": 2.0302855673066667e-08, "epoch": 19.484080188679247, "percentage": 97.42, "elapsed_time": "1:03:41", "remaining_time": "0:01:41", "throughput": 5642.68, "total_tokens": 21564616} {"current_steps": 33050, "total_steps": 33920, "loss": 0.271, "lr": 2.0071904101710004e-08, "epoch": 19.48702830188679, "percentage": 97.44, "elapsed_time": "1:03:42", "remaining_time": "0:01:40", "throughput": 5642.65, "total_tokens": 21567240} {"current_steps": 33055, "total_steps": 33920, "loss": 0.4516, "lr": 1.98422709877788e-08, "epoch": 19.48997641509434, "percentage": 97.45, "elapsed_time": "1:03:42", "remaining_time": "0:01:40", "throughput": 5642.56, "total_tokens": 21569896} {"current_steps": 33060, "total_steps": 33920, "loss": 0.3562, "lr": 1.961395639206942e-08, "epoch": 19.492924528301888, "percentage": 97.46, "elapsed_time": "1:03:43", "remaining_time": "0:01:39", "throughput": 5642.56, "total_tokens": 21573064} {"current_steps": 33065, "total_steps": 33920, "loss": 0.201, "lr": 1.9386960375029628e-08, "epoch": 19.495872641509433, "percentage": 97.48, "elapsed_time": "1:03:43", "remaining_time": "0:01:38", "throughput": 5642.62, "total_tokens": 21576232} {"current_steps": 33070, "total_steps": 33920, "loss": 0.3357, "lr": 1.9161282996757458e-08, "epoch": 19.49882075471698, "percentage": 97.49, "elapsed_time": "1:03:44", "remaining_time": "0:01:38", "throughput": 5642.66, "total_tokens": 21579208} {"current_steps": 33075, "total_steps": 33920, "loss": 0.3204, "lr": 1.8936924317001225e-08, "epoch": 19.50176886792453, "percentage": 97.51, "elapsed_time": "1:03:44", "remaining_time": "0:01:37", "throughput": 5642.73, "total_tokens": 21582504} {"current_steps": 33080, "total_steps": 33920, "loss": 0.179, "lr": 1.8713884395162308e-08, "epoch": 19.504716981132077, "percentage": 97.52, "elapsed_time": "1:03:45", "remaining_time": "0:01:37", "throughput": 5642.7, "total_tokens": 21585416} {"current_steps": 33085, "total_steps": 33920, "loss": 0.4274, "lr": 1.8492163290290132e-08, "epoch": 19.50766509433962, "percentage": 97.54, "elapsed_time": "1:03:45", "remaining_time": "0:01:36", "throughput": 5642.76, "total_tokens": 21588488} {"current_steps": 33090, "total_steps": 33920, "loss": 0.3146, "lr": 1.827176106108719e-08, "epoch": 19.51061320754717, "percentage": 97.55, "elapsed_time": "1:03:46", "remaining_time": "0:01:35", "throughput": 5642.81, "total_tokens": 21591592} {"current_steps": 33095, "total_steps": 33920, "loss": 0.3905, "lr": 1.8052677765905137e-08, "epoch": 19.513561320754718, "percentage": 97.57, "elapsed_time": "1:03:47", "remaining_time": "0:01:35", "throughput": 5642.89, "total_tokens": 21595432} {"current_steps": 33100, "total_steps": 33920, "loss": 0.3075, "lr": 1.783491346274757e-08, "epoch": 19.516509433962263, "percentage": 97.58, "elapsed_time": "1:03:47", "remaining_time": "0:01:34", "throughput": 5642.78, "total_tokens": 21597864} {"current_steps": 33105, "total_steps": 33920, "loss": 0.2955, "lr": 1.7618468209268936e-08, "epoch": 19.51945754716981, "percentage": 97.6, "elapsed_time": "1:03:48", "remaining_time": "0:01:34", "throughput": 5642.79, "total_tokens": 21600712} {"current_steps": 33110, "total_steps": 33920, "loss": 0.2128, "lr": 1.7403342062773943e-08, "epoch": 19.52240566037736, "percentage": 97.61, "elapsed_time": "1:03:48", "remaining_time": "0:01:33", "throughput": 5643.05, "total_tokens": 21606216} {"current_steps": 33115, "total_steps": 33920, "loss": 0.3772, "lr": 1.718953508021759e-08, "epoch": 19.525353773584907, "percentage": 97.63, "elapsed_time": "1:03:49", "remaining_time": "0:01:33", "throughput": 5643.14, "total_tokens": 21609768} {"current_steps": 33120, "total_steps": 33920, "loss": 0.4107, "lr": 1.6977047318206262e-08, "epoch": 19.528301886792452, "percentage": 97.64, "elapsed_time": "1:03:49", "remaining_time": "0:01:32", "throughput": 5643.06, "total_tokens": 21612200} {"current_steps": 33125, "total_steps": 33920, "loss": 0.3996, "lr": 1.676587883299774e-08, "epoch": 19.53125, "percentage": 97.66, "elapsed_time": "1:03:50", "remaining_time": "0:01:31", "throughput": 5643.16, "total_tokens": 21615752} {"current_steps": 33130, "total_steps": 33920, "loss": 0.2302, "lr": 1.655602968049952e-08, "epoch": 19.534198113207548, "percentage": 97.67, "elapsed_time": "1:03:50", "remaining_time": "0:01:31", "throughput": 5643.23, "total_tokens": 21618888} {"current_steps": 33135, "total_steps": 33920, "loss": 0.3375, "lr": 1.634749991626938e-08, "epoch": 19.537146226415093, "percentage": 97.69, "elapsed_time": "1:03:51", "remaining_time": "0:01:30", "throughput": 5643.12, "total_tokens": 21621352} {"current_steps": 33140, "total_steps": 33920, "loss": 0.3306, "lr": 1.6140289595517056e-08, "epoch": 19.54009433962264, "percentage": 97.7, "elapsed_time": "1:03:52", "remaining_time": "0:01:30", "throughput": 5643.32, "total_tokens": 21625960} {"current_steps": 33145, "total_steps": 33920, "loss": 0.3775, "lr": 1.5934398773102545e-08, "epoch": 19.54304245283019, "percentage": 97.72, "elapsed_time": "1:03:52", "remaining_time": "0:01:29", "throughput": 5643.41, "total_tokens": 21629480} {"current_steps": 33150, "total_steps": 33920, "loss": 0.325, "lr": 1.5729827503536133e-08, "epoch": 19.545990566037737, "percentage": 97.73, "elapsed_time": "1:03:53", "remaining_time": "0:01:29", "throughput": 5643.5, "total_tokens": 21633160} {"current_steps": 33155, "total_steps": 33920, "loss": 0.2864, "lr": 1.5526575840978942e-08, "epoch": 19.548938679245282, "percentage": 97.74, "elapsed_time": "1:03:53", "remaining_time": "0:01:28", "throughput": 5643.45, "total_tokens": 21635752} {"current_steps": 33160, "total_steps": 33920, "loss": 0.1994, "lr": 1.532464383924237e-08, "epoch": 19.55188679245283, "percentage": 97.76, "elapsed_time": "1:03:54", "remaining_time": "0:01:27", "throughput": 5643.49, "total_tokens": 21638792} {"current_steps": 33165, "total_steps": 33920, "loss": 0.3359, "lr": 1.5124031551789208e-08, "epoch": 19.55483490566038, "percentage": 97.77, "elapsed_time": "1:03:54", "remaining_time": "0:01:27", "throughput": 5643.51, "total_tokens": 21641672} {"current_steps": 33170, "total_steps": 33920, "loss": 0.3339, "lr": 1.4924739031732527e-08, "epoch": 19.557783018867923, "percentage": 97.79, "elapsed_time": "1:03:55", "remaining_time": "0:01:26", "throughput": 5643.47, "total_tokens": 21644232} {"current_steps": 33175, "total_steps": 33920, "loss": 0.3654, "lr": 1.4726766331835118e-08, "epoch": 19.56073113207547, "percentage": 97.8, "elapsed_time": "1:03:55", "remaining_time": "0:01:26", "throughput": 5643.56, "total_tokens": 21647624} {"current_steps": 33180, "total_steps": 33920, "loss": 0.2071, "lr": 1.4530113504512278e-08, "epoch": 19.56367924528302, "percentage": 97.82, "elapsed_time": "1:03:56", "remaining_time": "0:01:25", "throughput": 5643.52, "total_tokens": 21650152} {"current_steps": 33185, "total_steps": 33920, "loss": 0.3733, "lr": 1.4334780601827914e-08, "epoch": 19.566627358490567, "percentage": 97.83, "elapsed_time": "1:03:56", "remaining_time": "0:01:24", "throughput": 5643.61, "total_tokens": 21653608} {"current_steps": 33190, "total_steps": 33920, "loss": 0.3154, "lr": 1.4140767675497325e-08, "epoch": 19.569575471698112, "percentage": 97.85, "elapsed_time": "1:03:57", "remaining_time": "0:01:24", "throughput": 5643.78, "total_tokens": 21658120} {"current_steps": 33195, "total_steps": 33920, "loss": 0.1911, "lr": 1.394807477688609e-08, "epoch": 19.57252358490566, "percentage": 97.86, "elapsed_time": "1:03:58", "remaining_time": "0:01:23", "throughput": 5643.85, "total_tokens": 21661480} {"current_steps": 33200, "total_steps": 33920, "loss": 0.2926, "lr": 1.3756701957011177e-08, "epoch": 19.57547169811321, "percentage": 97.88, "elapsed_time": "1:03:58", "remaining_time": "0:01:23", "throughput": 5643.87, "total_tokens": 21664456} {"current_steps": 33205, "total_steps": 33920, "loss": 0.2349, "lr": 1.3566649266538723e-08, "epoch": 19.578419811320753, "percentage": 97.89, "elapsed_time": "1:03:59", "remaining_time": "0:01:22", "throughput": 5643.92, "total_tokens": 21667592} {"current_steps": 33210, "total_steps": 33920, "loss": 0.3306, "lr": 1.3377916755786257e-08, "epoch": 19.5813679245283, "percentage": 97.91, "elapsed_time": "1:03:59", "remaining_time": "0:01:22", "throughput": 5643.89, "total_tokens": 21670536} {"current_steps": 33215, "total_steps": 33920, "loss": 0.2972, "lr": 1.3190504474721588e-08, "epoch": 19.58431603773585, "percentage": 97.92, "elapsed_time": "1:04:00", "remaining_time": "0:01:21", "throughput": 5643.88, "total_tokens": 21673256} {"current_steps": 33220, "total_steps": 33920, "loss": 0.2841, "lr": 1.3004412472962802e-08, "epoch": 19.587264150943398, "percentage": 97.94, "elapsed_time": "1:04:00", "remaining_time": "0:01:20", "throughput": 5643.91, "total_tokens": 21676424} {"current_steps": 33225, "total_steps": 33920, "loss": 0.2338, "lr": 1.2819640799778266e-08, "epoch": 19.590212264150942, "percentage": 97.95, "elapsed_time": "1:04:01", "remaining_time": "0:01:20", "throughput": 5643.91, "total_tokens": 21679528} {"current_steps": 33230, "total_steps": 33920, "loss": 0.3074, "lr": 1.2636189504087737e-08, "epoch": 19.59316037735849, "percentage": 97.97, "elapsed_time": "1:04:01", "remaining_time": "0:01:19", "throughput": 5643.85, "total_tokens": 21682088} {"current_steps": 33235, "total_steps": 33920, "loss": 0.281, "lr": 1.2454058634460142e-08, "epoch": 19.59610849056604, "percentage": 97.98, "elapsed_time": "1:04:02", "remaining_time": "0:01:19", "throughput": 5643.86, "total_tokens": 21685192} {"current_steps": 33240, "total_steps": 33920, "loss": 0.3018, "lr": 1.2273248239115798e-08, "epoch": 19.599056603773583, "percentage": 98.0, "elapsed_time": "1:04:02", "remaining_time": "0:01:18", "throughput": 5643.82, "total_tokens": 21687912} {"current_steps": 33245, "total_steps": 33920, "loss": 0.2699, "lr": 1.2093758365924746e-08, "epoch": 19.60200471698113, "percentage": 98.01, "elapsed_time": "1:04:03", "remaining_time": "0:01:18", "throughput": 5643.93, "total_tokens": 21691560} {"current_steps": 33250, "total_steps": 33920, "loss": 0.3169, "lr": 1.1915589062408417e-08, "epoch": 19.60495283018868, "percentage": 98.02, "elapsed_time": "1:04:03", "remaining_time": "0:01:17", "throughput": 5643.99, "total_tokens": 21694696} {"current_steps": 33255, "total_steps": 33920, "loss": 0.2779, "lr": 1.1738740375736301e-08, "epoch": 19.607900943396228, "percentage": 98.04, "elapsed_time": "1:04:04", "remaining_time": "0:01:16", "throughput": 5644.09, "total_tokens": 21698344} {"current_steps": 33260, "total_steps": 33920, "loss": 0.2563, "lr": 1.15632123527315e-08, "epoch": 19.610849056603772, "percentage": 98.05, "elapsed_time": "1:04:05", "remaining_time": "0:01:16", "throughput": 5644.16, "total_tokens": 21702024} {"current_steps": 33265, "total_steps": 33920, "loss": 0.2604, "lr": 1.1389005039865176e-08, "epoch": 19.61379716981132, "percentage": 98.07, "elapsed_time": "1:04:05", "remaining_time": "0:01:15", "throughput": 5644.28, "total_tokens": 21705736} {"current_steps": 33270, "total_steps": 33920, "loss": 0.3332, "lr": 1.1216118483259875e-08, "epoch": 19.61674528301887, "percentage": 98.08, "elapsed_time": "1:04:06", "remaining_time": "0:01:15", "throughput": 5644.32, "total_tokens": 21708808} {"current_steps": 33275, "total_steps": 33920, "loss": 0.3127, "lr": 1.1044552728687319e-08, "epoch": 19.619693396226417, "percentage": 98.1, "elapsed_time": "1:04:06", "remaining_time": "0:01:14", "throughput": 5644.2, "total_tokens": 21711112} {"current_steps": 33280, "total_steps": 33920, "loss": 0.3657, "lr": 1.0874307821570618e-08, "epoch": 19.62264150943396, "percentage": 98.11, "elapsed_time": "1:04:07", "remaining_time": "0:01:13", "throughput": 5644.26, "total_tokens": 21714600} {"current_steps": 33285, "total_steps": 33920, "loss": 0.2756, "lr": 1.0705383806982606e-08, "epoch": 19.62558962264151, "percentage": 98.13, "elapsed_time": "1:04:07", "remaining_time": "0:01:13", "throughput": 5644.36, "total_tokens": 21717992} {"current_steps": 33290, "total_steps": 33920, "loss": 0.1905, "lr": 1.0537780729646952e-08, "epoch": 19.628537735849058, "percentage": 98.14, "elapsed_time": "1:04:08", "remaining_time": "0:01:12", "throughput": 5644.25, "total_tokens": 21720392} {"current_steps": 33295, "total_steps": 33920, "loss": 0.357, "lr": 1.0371498633937605e-08, "epoch": 19.631485849056602, "percentage": 98.16, "elapsed_time": "1:04:08", "remaining_time": "0:01:12", "throughput": 5644.23, "total_tokens": 21723528} {"current_steps": 33300, "total_steps": 33920, "loss": 0.2156, "lr": 1.0206537563877683e-08, "epoch": 19.63443396226415, "percentage": 98.17, "elapsed_time": "1:04:09", "remaining_time": "0:01:11", "throughput": 5644.24, "total_tokens": 21726600} {"current_steps": 33305, "total_steps": 33920, "loss": 0.2274, "lr": 1.0042897563141695e-08, "epoch": 19.6373820754717, "percentage": 98.19, "elapsed_time": "1:04:09", "remaining_time": "0:01:11", "throughput": 5644.25, "total_tokens": 21729608} {"current_steps": 33310, "total_steps": 33920, "loss": 0.3439, "lr": 9.88057867505443e-09, "epoch": 19.640330188679247, "percentage": 98.2, "elapsed_time": "1:04:10", "remaining_time": "0:01:10", "throughput": 5644.31, "total_tokens": 21732904} {"current_steps": 33315, "total_steps": 33920, "loss": 0.4144, "lr": 9.7195809425904e-09, "epoch": 19.64327830188679, "percentage": 98.22, "elapsed_time": "1:04:10", "remaining_time": "0:01:09", "throughput": 5644.2, "total_tokens": 21735496} {"current_steps": 33320, "total_steps": 33920, "loss": 0.2932, "lr": 9.559904408373844e-09, "epoch": 19.64622641509434, "percentage": 98.23, "elapsed_time": "1:04:11", "remaining_time": "0:01:09", "throughput": 5644.13, "total_tokens": 21738024} {"current_steps": 33325, "total_steps": 33920, "loss": 0.2104, "lr": 9.401549114680387e-09, "epoch": 19.649174528301888, "percentage": 98.25, "elapsed_time": "1:04:12", "remaining_time": "0:01:08", "throughput": 5644.29, "total_tokens": 21742280} {"current_steps": 33330, "total_steps": 33920, "loss": 0.2711, "lr": 9.244515103434826e-09, "epoch": 19.652122641509433, "percentage": 98.26, "elapsed_time": "1:04:12", "remaining_time": "0:01:08", "throughput": 5644.33, "total_tokens": 21745416} {"current_steps": 33335, "total_steps": 33920, "loss": 0.2808, "lr": 9.08880241621335e-09, "epoch": 19.65507075471698, "percentage": 98.28, "elapsed_time": "1:04:13", "remaining_time": "0:01:07", "throughput": 5644.53, "total_tokens": 21750344} {"current_steps": 33340, "total_steps": 33920, "loss": 0.3335, "lr": 8.934411094240758e-09, "epoch": 19.65801886792453, "percentage": 98.29, "elapsed_time": "1:04:13", "remaining_time": "0:01:07", "throughput": 5644.58, "total_tokens": 21754152} {"current_steps": 33345, "total_steps": 33920, "loss": 0.3372, "lr": 8.781341178393244e-09, "epoch": 19.660966981132077, "percentage": 98.3, "elapsed_time": "1:04:14", "remaining_time": "0:01:06", "throughput": 5644.69, "total_tokens": 21757800} {"current_steps": 33350, "total_steps": 33920, "loss": 0.3472, "lr": 8.629592709196167e-09, "epoch": 19.66391509433962, "percentage": 98.32, "elapsed_time": "1:04:15", "remaining_time": "0:01:05", "throughput": 5644.7, "total_tokens": 21760808} {"current_steps": 33355, "total_steps": 33920, "loss": 0.2646, "lr": 8.479165726826277e-09, "epoch": 19.66686320754717, "percentage": 98.33, "elapsed_time": "1:04:15", "remaining_time": "0:01:05", "throughput": 5644.58, "total_tokens": 21763848} {"current_steps": 33360, "total_steps": 33920, "loss": 0.3371, "lr": 8.330060271109496e-09, "epoch": 19.669811320754718, "percentage": 98.35, "elapsed_time": "1:04:16", "remaining_time": "0:01:04", "throughput": 5644.63, "total_tokens": 21766856} {"current_steps": 33365, "total_steps": 33920, "loss": 0.2962, "lr": 8.18227638152258e-09, "epoch": 19.672759433962263, "percentage": 98.36, "elapsed_time": "1:04:16", "remaining_time": "0:01:04", "throughput": 5644.65, "total_tokens": 21770088} {"current_steps": 33370, "total_steps": 33920, "loss": 0.3431, "lr": 8.035814097191452e-09, "epoch": 19.67570754716981, "percentage": 98.38, "elapsed_time": "1:04:17", "remaining_time": "0:01:03", "throughput": 5644.69, "total_tokens": 21773128} {"current_steps": 33375, "total_steps": 33920, "loss": 0.294, "lr": 7.890673456892317e-09, "epoch": 19.67865566037736, "percentage": 98.39, "elapsed_time": "1:04:17", "remaining_time": "0:01:02", "throughput": 5644.7, "total_tokens": 21776296} {"current_steps": 33380, "total_steps": 33920, "loss": 0.2832, "lr": 7.746854499052215e-09, "epoch": 19.681603773584907, "percentage": 98.41, "elapsed_time": "1:04:18", "remaining_time": "0:01:02", "throughput": 5644.64, "total_tokens": 21779176} {"current_steps": 33385, "total_steps": 33920, "loss": 0.4126, "lr": 7.604357261747907e-09, "epoch": 19.684551886792452, "percentage": 98.42, "elapsed_time": "1:04:18", "remaining_time": "0:01:01", "throughput": 5644.74, "total_tokens": 21782632} {"current_steps": 33390, "total_steps": 33920, "loss": 0.3576, "lr": 7.463181782705886e-09, "epoch": 19.6875, "percentage": 98.44, "elapsed_time": "1:04:19", "remaining_time": "0:01:01", "throughput": 5644.65, "total_tokens": 21785512} {"current_steps": 33395, "total_steps": 33920, "loss": 0.3427, "lr": 7.3233280993034726e-09, "epoch": 19.690448113207548, "percentage": 98.45, "elapsed_time": "1:04:20", "remaining_time": "0:01:00", "throughput": 5644.75, "total_tokens": 21789128} {"current_steps": 33400, "total_steps": 33920, "loss": 0.3668, "lr": 7.184796248567161e-09, "epoch": 19.693396226415093, "percentage": 98.47, "elapsed_time": "1:04:20", "remaining_time": "0:01:00", "throughput": 5644.77, "total_tokens": 21792168} {"current_steps": 33405, "total_steps": 33920, "loss": 0.2823, "lr": 7.047586267173723e-09, "epoch": 19.69634433962264, "percentage": 98.48, "elapsed_time": "1:04:21", "remaining_time": "0:00:59", "throughput": 5644.72, "total_tokens": 21794888} {"current_steps": 33410, "total_steps": 33920, "loss": 0.301, "lr": 6.9116981914502114e-09, "epoch": 19.69929245283019, "percentage": 98.5, "elapsed_time": "1:04:21", "remaining_time": "0:00:58", "throughput": 5644.76, "total_tokens": 21798152} {"current_steps": 33415, "total_steps": 33920, "loss": 0.4092, "lr": 6.7771320573734036e-09, "epoch": 19.702240566037737, "percentage": 98.51, "elapsed_time": "1:04:22", "remaining_time": "0:00:58", "throughput": 5644.72, "total_tokens": 21801000} {"current_steps": 33420, "total_steps": 33920, "loss": 0.2337, "lr": 6.6438879005709114e-09, "epoch": 19.705188679245282, "percentage": 98.53, "elapsed_time": "1:04:22", "remaining_time": "0:00:57", "throughput": 5644.8, "total_tokens": 21804392} {"current_steps": 33425, "total_steps": 33920, "loss": 0.398, "lr": 6.511965756318961e-09, "epoch": 19.70813679245283, "percentage": 98.54, "elapsed_time": "1:04:23", "remaining_time": "0:00:57", "throughput": 5644.82, "total_tokens": 21807304} {"current_steps": 33430, "total_steps": 33920, "loss": 0.2455, "lr": 6.381365659545169e-09, "epoch": 19.71108490566038, "percentage": 98.56, "elapsed_time": "1:04:23", "remaining_time": "0:00:56", "throughput": 5645.01, "total_tokens": 21812008} {"current_steps": 33435, "total_steps": 33920, "loss": 0.2908, "lr": 6.252087644825766e-09, "epoch": 19.714033018867923, "percentage": 98.57, "elapsed_time": "1:04:24", "remaining_time": "0:00:56", "throughput": 5644.97, "total_tokens": 21814696} {"current_steps": 33440, "total_steps": 33920, "loss": 0.2589, "lr": 6.124131746388373e-09, "epoch": 19.71698113207547, "percentage": 98.58, "elapsed_time": "1:04:25", "remaining_time": "0:00:55", "throughput": 5645.07, "total_tokens": 21818344} {"current_steps": 33445, "total_steps": 33920, "loss": 0.2833, "lr": 5.997497998109225e-09, "epoch": 19.71992924528302, "percentage": 98.6, "elapsed_time": "1:04:25", "remaining_time": "0:00:54", "throughput": 5645.13, "total_tokens": 21821480} {"current_steps": 33450, "total_steps": 33920, "loss": 0.2268, "lr": 5.8721864335153925e-09, "epoch": 19.722877358490567, "percentage": 98.61, "elapsed_time": "1:04:26", "remaining_time": "0:00:54", "throughput": 5645.32, "total_tokens": 21827240} {"current_steps": 33455, "total_steps": 33920, "loss": 0.1984, "lr": 5.748197085784224e-09, "epoch": 19.725825471698112, "percentage": 98.63, "elapsed_time": "1:04:26", "remaining_time": "0:00:53", "throughput": 5645.35, "total_tokens": 21830440} {"current_steps": 33460, "total_steps": 33920, "loss": 0.3141, "lr": 5.62552998774113e-09, "epoch": 19.72877358490566, "percentage": 98.64, "elapsed_time": "1:04:27", "remaining_time": "0:00:53", "throughput": 5645.33, "total_tokens": 21833320} {"current_steps": 33465, "total_steps": 33920, "loss": 0.337, "lr": 5.504185171864018e-09, "epoch": 19.73172169811321, "percentage": 98.66, "elapsed_time": "1:04:28", "remaining_time": "0:00:52", "throughput": 5645.45, "total_tokens": 21837352} {"current_steps": 33470, "total_steps": 33920, "loss": 0.3542, "lr": 5.384162670278858e-09, "epoch": 19.734669811320753, "percentage": 98.67, "elapsed_time": "1:04:28", "remaining_time": "0:00:52", "throughput": 5645.43, "total_tokens": 21840104} {"current_steps": 33475, "total_steps": 33920, "loss": 0.279, "lr": 5.265462514762454e-09, "epoch": 19.7376179245283, "percentage": 98.69, "elapsed_time": "1:04:29", "remaining_time": "0:00:51", "throughput": 5645.42, "total_tokens": 21842856} {"current_steps": 33480, "total_steps": 33920, "loss": 0.3237, "lr": 5.148084736740777e-09, "epoch": 19.74056603773585, "percentage": 98.7, "elapsed_time": "1:04:29", "remaining_time": "0:00:50", "throughput": 5645.51, "total_tokens": 21845992} {"current_steps": 33485, "total_steps": 33920, "loss": 0.311, "lr": 5.032029367290081e-09, "epoch": 19.743514150943398, "percentage": 98.72, "elapsed_time": "1:04:30", "remaining_time": "0:00:50", "throughput": 5645.64, "total_tokens": 21849576} {"current_steps": 33490, "total_steps": 33920, "loss": 0.2966, "lr": 4.917296437136898e-09, "epoch": 19.746462264150942, "percentage": 98.73, "elapsed_time": "1:04:30", "remaining_time": "0:00:49", "throughput": 5645.72, "total_tokens": 21852808} {"current_steps": 33495, "total_steps": 33920, "loss": 0.3706, "lr": 4.8038859766569305e-09, "epoch": 19.74941037735849, "percentage": 98.75, "elapsed_time": "1:04:31", "remaining_time": "0:00:49", "throughput": 5645.73, "total_tokens": 21855720} {"current_steps": 33500, "total_steps": 33920, "loss": 0.3162, "lr": 4.691798015876714e-09, "epoch": 19.75235849056604, "percentage": 98.76, "elapsed_time": "1:04:31", "remaining_time": "0:00:48", "throughput": 5645.68, "total_tokens": 21858248} {"current_steps": 33505, "total_steps": 33920, "loss": 0.3158, "lr": 4.581032584470846e-09, "epoch": 19.755306603773583, "percentage": 98.78, "elapsed_time": "1:04:32", "remaining_time": "0:00:47", "throughput": 5645.81, "total_tokens": 21861928} {"current_steps": 33510, "total_steps": 33920, "loss": 0.2533, "lr": 4.471589711766422e-09, "epoch": 19.75825471698113, "percentage": 98.79, "elapsed_time": "1:04:33", "remaining_time": "0:00:47", "throughput": 5646.02, "total_tokens": 21868200} {"current_steps": 33515, "total_steps": 33920, "loss": 0.31, "lr": 4.363469426737487e-09, "epoch": 19.76120283018868, "percentage": 98.81, "elapsed_time": "1:04:33", "remaining_time": "0:00:46", "throughput": 5646.01, "total_tokens": 21871336} {"current_steps": 33520, "total_steps": 33920, "loss": 0.2765, "lr": 4.256671758010588e-09, "epoch": 19.764150943396228, "percentage": 98.82, "elapsed_time": "1:04:34", "remaining_time": "0:00:46", "throughput": 5646.02, "total_tokens": 21874088} {"current_steps": 33525, "total_steps": 33920, "loss": 0.2339, "lr": 4.151196733859775e-09, "epoch": 19.767099056603772, "percentage": 98.84, "elapsed_time": "1:04:34", "remaining_time": "0:00:45", "throughput": 5646.0, "total_tokens": 21876936} {"current_steps": 33530, "total_steps": 33920, "loss": 0.2932, "lr": 4.047044382211041e-09, "epoch": 19.77004716981132, "percentage": 98.85, "elapsed_time": "1:04:35", "remaining_time": "0:00:45", "throughput": 5646.05, "total_tokens": 21880104} {"current_steps": 33535, "total_steps": 33920, "loss": 0.3409, "lr": 3.94421473063844e-09, "epoch": 19.77299528301887, "percentage": 98.86, "elapsed_time": "1:04:35", "remaining_time": "0:00:44", "throughput": 5646.11, "total_tokens": 21883528} {"current_steps": 33540, "total_steps": 33920, "loss": 0.5135, "lr": 3.842707806366863e-09, "epoch": 19.775943396226417, "percentage": 98.88, "elapsed_time": "1:04:36", "remaining_time": "0:00:43", "throughput": 5646.26, "total_tokens": 21887752} {"current_steps": 33545, "total_steps": 33920, "loss": 0.4784, "lr": 3.742523636270368e-09, "epoch": 19.77889150943396, "percentage": 98.89, "elapsed_time": "1:04:37", "remaining_time": "0:00:43", "throughput": 5646.36, "total_tokens": 21891240} {"current_steps": 33550, "total_steps": 33920, "loss": 0.3121, "lr": 3.6436622468738468e-09, "epoch": 19.78183962264151, "percentage": 98.91, "elapsed_time": "1:04:37", "remaining_time": "0:00:42", "throughput": 5646.32, "total_tokens": 21893864} {"current_steps": 33555, "total_steps": 33920, "loss": 0.3719, "lr": 3.546123664350254e-09, "epoch": 19.784787735849058, "percentage": 98.92, "elapsed_time": "1:04:38", "remaining_time": "0:00:42", "throughput": 5646.36, "total_tokens": 21896904} {"current_steps": 33560, "total_steps": 33920, "loss": 0.347, "lr": 3.449907914524486e-09, "epoch": 19.787735849056602, "percentage": 98.94, "elapsed_time": "1:04:38", "remaining_time": "0:00:41", "throughput": 5646.24, "total_tokens": 21899400} {"current_steps": 33565, "total_steps": 33920, "loss": 0.2557, "lr": 3.355015022869501e-09, "epoch": 19.79068396226415, "percentage": 98.95, "elapsed_time": "1:04:39", "remaining_time": "0:00:41", "throughput": 5646.28, "total_tokens": 21902408} {"current_steps": 33570, "total_steps": 33920, "loss": 0.3006, "lr": 3.261445014508535e-09, "epoch": 19.7936320754717, "percentage": 98.97, "elapsed_time": "1:04:39", "remaining_time": "0:00:40", "throughput": 5646.33, "total_tokens": 21905992} {"current_steps": 33575, "total_steps": 33920, "loss": 0.3445, "lr": 3.1691979142145503e-09, "epoch": 19.796580188679247, "percentage": 98.98, "elapsed_time": "1:04:40", "remaining_time": "0:00:39", "throughput": 5646.58, "total_tokens": 21910920} {"current_steps": 33580, "total_steps": 33920, "loss": 0.2323, "lr": 3.078273746410787e-09, "epoch": 19.79952830188679, "percentage": 99.0, "elapsed_time": "1:04:41", "remaining_time": "0:00:39", "throughput": 5646.68, "total_tokens": 21914984} {"current_steps": 33585, "total_steps": 33920, "loss": 0.3341, "lr": 2.988672535169657e-09, "epoch": 19.80247641509434, "percentage": 99.01, "elapsed_time": "1:04:41", "remaining_time": "0:00:38", "throughput": 5646.66, "total_tokens": 21917800} {"current_steps": 33590, "total_steps": 33920, "loss": 0.2924, "lr": 2.9003943042127393e-09, "epoch": 19.805424528301888, "percentage": 99.03, "elapsed_time": "1:04:42", "remaining_time": "0:00:38", "throughput": 5646.65, "total_tokens": 21920680} {"current_steps": 33595, "total_steps": 33920, "loss": 0.3244, "lr": 2.8134390769135598e-09, "epoch": 19.808372641509433, "percentage": 99.04, "elapsed_time": "1:04:42", "remaining_time": "0:00:37", "throughput": 5646.71, "total_tokens": 21923880} {"current_steps": 33600, "total_steps": 33920, "loss": 0.2789, "lr": 2.7278068762925935e-09, "epoch": 19.81132075471698, "percentage": 99.06, "elapsed_time": "1:04:43", "remaining_time": "0:00:36", "throughput": 5646.7, "total_tokens": 21926632} {"current_steps": 33605, "total_steps": 33920, "loss": 0.3285, "lr": 2.6434977250217043e-09, "epoch": 19.81426886792453, "percentage": 99.07, "elapsed_time": "1:04:43", "remaining_time": "0:00:36", "throughput": 5646.68, "total_tokens": 21929544} {"current_steps": 33610, "total_steps": 33920, "loss": 0.2893, "lr": 2.560511645422481e-09, "epoch": 19.817216981132077, "percentage": 99.09, "elapsed_time": "1:04:44", "remaining_time": "0:00:35", "throughput": 5646.7, "total_tokens": 21932424} {"current_steps": 33615, "total_steps": 33920, "loss": 0.3389, "lr": 2.4788486594656825e-09, "epoch": 19.82016509433962, "percentage": 99.1, "elapsed_time": "1:04:44", "remaining_time": "0:00:35", "throughput": 5646.76, "total_tokens": 21935848} {"current_steps": 33620, "total_steps": 33920, "loss": 0.4151, "lr": 2.398508788771792e-09, "epoch": 19.82311320754717, "percentage": 99.12, "elapsed_time": "1:04:45", "remaining_time": "0:00:34", "throughput": 5646.86, "total_tokens": 21939240} {"current_steps": 33625, "total_steps": 33920, "loss": 0.2993, "lr": 2.3194920546110166e-09, "epoch": 19.826061320754718, "percentage": 99.13, "elapsed_time": "1:04:45", "remaining_time": "0:00:34", "throughput": 5646.9, "total_tokens": 21942312} {"current_steps": 33630, "total_steps": 33920, "loss": 0.3233, "lr": 2.2417984779032896e-09, "epoch": 19.829009433962263, "percentage": 99.15, "elapsed_time": "1:04:46", "remaining_time": "0:00:33", "throughput": 5646.94, "total_tokens": 21945800} {"current_steps": 33635, "total_steps": 33920, "loss": 0.3665, "lr": 2.1654280792193782e-09, "epoch": 19.83195754716981, "percentage": 99.16, "elapsed_time": "1:04:46", "remaining_time": "0:00:32", "throughput": 5647.09, "total_tokens": 21949544} {"current_steps": 33640, "total_steps": 33920, "loss": 0.3524, "lr": 2.0903808787769987e-09, "epoch": 19.83490566037736, "percentage": 99.17, "elapsed_time": "1:04:47", "remaining_time": "0:00:32", "throughput": 5647.14, "total_tokens": 21952808} {"current_steps": 33645, "total_steps": 33920, "loss": 0.2926, "lr": 2.0166568964463673e-09, "epoch": 19.837853773584907, "percentage": 99.19, "elapsed_time": "1:04:48", "remaining_time": "0:00:31", "throughput": 5647.41, "total_tokens": 21960040} {"current_steps": 33650, "total_steps": 33920, "loss": 0.2284, "lr": 1.9442561517463153e-09, "epoch": 19.840801886792452, "percentage": 99.2, "elapsed_time": "1:04:49", "remaining_time": "0:00:31", "throughput": 5647.55, "total_tokens": 21963784} {"current_steps": 33655, "total_steps": 33920, "loss": 0.335, "lr": 1.8731786638442886e-09, "epoch": 19.84375, "percentage": 99.22, "elapsed_time": "1:04:49", "remaining_time": "0:00:30", "throughput": 5647.67, "total_tokens": 21967144} {"current_steps": 33660, "total_steps": 33920, "loss": 0.3539, "lr": 1.8034244515591214e-09, "epoch": 19.846698113207548, "percentage": 99.23, "elapsed_time": "1:04:50", "remaining_time": "0:00:30", "throughput": 5647.76, "total_tokens": 21970248} {"current_steps": 33665, "total_steps": 33920, "loss": 0.2825, "lr": 1.7349935333582646e-09, "epoch": 19.849646226415093, "percentage": 99.25, "elapsed_time": "1:04:50", "remaining_time": "0:00:29", "throughput": 5647.86, "total_tokens": 21973448} {"current_steps": 33670, "total_steps": 33920, "loss": 0.2435, "lr": 1.6678859273594471e-09, "epoch": 19.85259433962264, "percentage": 99.26, "elapsed_time": "1:04:51", "remaining_time": "0:00:28", "throughput": 5647.87, "total_tokens": 21976360} {"current_steps": 33675, "total_steps": 33920, "loss": 0.301, "lr": 1.6021016513295683e-09, "epoch": 19.85554245283019, "percentage": 99.28, "elapsed_time": "1:04:51", "remaining_time": "0:00:28", "throughput": 5647.77, "total_tokens": 21979208} {"current_steps": 33680, "total_steps": 33920, "loss": 0.3385, "lr": 1.5376407226846968e-09, "epoch": 19.858490566037737, "percentage": 99.29, "elapsed_time": "1:04:52", "remaining_time": "0:00:27", "throughput": 5647.62, "total_tokens": 21981672} {"current_steps": 33685, "total_steps": 33920, "loss": 0.2773, "lr": 1.4745031584917357e-09, "epoch": 19.861438679245282, "percentage": 99.31, "elapsed_time": "1:04:52", "remaining_time": "0:00:27", "throughput": 5647.41, "total_tokens": 21983944} {"current_steps": 33690, "total_steps": 33920, "loss": 0.2815, "lr": 1.4126889754667583e-09, "epoch": 19.86438679245283, "percentage": 99.32, "elapsed_time": "1:04:53", "remaining_time": "0:00:26", "throughput": 5647.39, "total_tokens": 21987208} {"current_steps": 33695, "total_steps": 33920, "loss": 0.3957, "lr": 1.3521981899750069e-09, "epoch": 19.86733490566038, "percentage": 99.34, "elapsed_time": "1:04:54", "remaining_time": "0:00:26", "throughput": 5647.57, "total_tokens": 21991912} {"current_steps": 33700, "total_steps": 33920, "loss": 0.3726, "lr": 1.293030818032004e-09, "epoch": 19.870283018867923, "percentage": 99.35, "elapsed_time": "1:04:54", "remaining_time": "0:00:25", "throughput": 5647.68, "total_tokens": 21995976} {"current_steps": 33705, "total_steps": 33920, "loss": 0.3954, "lr": 1.2351868753018858e-09, "epoch": 19.87323113207547, "percentage": 99.37, "elapsed_time": "1:04:55", "remaining_time": "0:00:24", "throughput": 5647.73, "total_tokens": 21999144} {"current_steps": 33710, "total_steps": 33920, "loss": 0.189, "lr": 1.1786663770996242e-09, "epoch": 19.87617924528302, "percentage": 99.38, "elapsed_time": "1:04:55", "remaining_time": "0:00:24", "throughput": 5647.78, "total_tokens": 22002216} {"current_steps": 33715, "total_steps": 33920, "loss": 0.3457, "lr": 1.1234693383893602e-09, "epoch": 19.879127358490567, "percentage": 99.4, "elapsed_time": "1:04:56", "remaining_time": "0:00:23", "throughput": 5648.0, "total_tokens": 22007016} {"current_steps": 33720, "total_steps": 33920, "loss": 0.3566, "lr": 1.0695957737844043e-09, "epoch": 19.882075471698112, "percentage": 99.41, "elapsed_time": "1:04:56", "remaining_time": "0:00:23", "throughput": 5648.09, "total_tokens": 22010440} {"current_steps": 33725, "total_steps": 33920, "loss": 0.2645, "lr": 1.0170456975483467e-09, "epoch": 19.88502358490566, "percentage": 99.43, "elapsed_time": "1:04:57", "remaining_time": "0:00:22", "throughput": 5648.15, "total_tokens": 22014088} {"current_steps": 33730, "total_steps": 33920, "loss": 0.3112, "lr": 9.658191235933922e-10, "epoch": 19.88797169811321, "percentage": 99.44, "elapsed_time": "1:04:58", "remaining_time": "0:00:21", "throughput": 5648.2, "total_tokens": 22017352} {"current_steps": 33735, "total_steps": 33920, "loss": 0.295, "lr": 9.159160654825805e-10, "epoch": 19.890919811320753, "percentage": 99.45, "elapsed_time": "1:04:58", "remaining_time": "0:00:21", "throughput": 5648.27, "total_tokens": 22021192} {"current_steps": 33740, "total_steps": 33920, "loss": 0.2125, "lr": 8.673365364281205e-10, "epoch": 19.8938679245283, "percentage": 99.47, "elapsed_time": "1:04:59", "remaining_time": "0:00:20", "throughput": 5648.14, "total_tokens": 22023784} {"current_steps": 33745, "total_steps": 33920, "loss": 0.288, "lr": 8.200805492913911e-10, "epoch": 19.89681603773585, "percentage": 99.48, "elapsed_time": "1:04:59", "remaining_time": "0:00:20", "throughput": 5648.22, "total_tokens": 22027176} {"current_steps": 33750, "total_steps": 33920, "loss": 0.3316, "lr": 7.741481165834952e-10, "epoch": 19.899764150943398, "percentage": 99.5, "elapsed_time": "1:05:00", "remaining_time": "0:00:19", "throughput": 5648.22, "total_tokens": 22030248} {"current_steps": 33755, "total_steps": 33920, "loss": 0.3139, "lr": 7.29539250465261e-10, "epoch": 19.902712264150942, "percentage": 99.51, "elapsed_time": "1:05:00", "remaining_time": "0:00:19", "throughput": 5648.26, "total_tokens": 22033384} {"current_steps": 33760, "total_steps": 33920, "loss": 0.3287, "lr": 6.862539627472409e-10, "epoch": 19.90566037735849, "percentage": 99.53, "elapsed_time": "1:05:01", "remaining_time": "0:00:18", "throughput": 5648.33, "total_tokens": 22037128} {"current_steps": 33765, "total_steps": 33920, "loss": 0.35, "lr": 6.442922648897121e-10, "epoch": 19.90860849056604, "percentage": 99.54, "elapsed_time": "1:05:02", "remaining_time": "0:00:17", "throughput": 5648.31, "total_tokens": 22040264} {"current_steps": 33770, "total_steps": 33920, "loss": 0.3984, "lr": 6.036541680015662e-10, "epoch": 19.911556603773583, "percentage": 99.56, "elapsed_time": "1:05:02", "remaining_time": "0:00:17", "throughput": 5648.18, "total_tokens": 22042472} {"current_steps": 33775, "total_steps": 33920, "loss": 0.3069, "lr": 5.643396828419745e-10, "epoch": 19.91450471698113, "percentage": 99.57, "elapsed_time": "1:05:03", "remaining_time": "0:00:16", "throughput": 5648.24, "total_tokens": 22046088} {"current_steps": 33780, "total_steps": 33920, "loss": 0.3025, "lr": 5.26348819819833e-10, "epoch": 19.91745283018868, "percentage": 99.59, "elapsed_time": "1:05:03", "remaining_time": "0:00:16", "throughput": 5648.27, "total_tokens": 22049192} {"current_steps": 33785, "total_steps": 33920, "loss": 0.2736, "lr": 4.896815889937622e-10, "epoch": 19.920400943396228, "percentage": 99.6, "elapsed_time": "1:05:04", "remaining_time": "0:00:15", "throughput": 5648.3, "total_tokens": 22052776} {"current_steps": 33790, "total_steps": 33920, "loss": 0.3318, "lr": 4.543380000704423e-10, "epoch": 19.923349056603772, "percentage": 99.62, "elapsed_time": "1:05:04", "remaining_time": "0:00:15", "throughput": 5648.34, "total_tokens": 22055752} {"current_steps": 33795, "total_steps": 33920, "loss": 0.2691, "lr": 4.203180624084979e-10, "epoch": 19.92629716981132, "percentage": 99.63, "elapsed_time": "1:05:05", "remaining_time": "0:00:14", "throughput": 5648.39, "total_tokens": 22059048} {"current_steps": 33800, "total_steps": 33920, "loss": 0.3122, "lr": 3.876217850146136e-10, "epoch": 19.92924528301887, "percentage": 99.65, "elapsed_time": "1:05:05", "remaining_time": "0:00:13", "throughput": 5648.56, "total_tokens": 22063176} {"current_steps": 33805, "total_steps": 33920, "loss": 0.3053, "lr": 3.56249176544643e-10, "epoch": 19.932193396226417, "percentage": 99.66, "elapsed_time": "1:05:06", "remaining_time": "0:00:13", "throughput": 5648.65, "total_tokens": 22066952} {"current_steps": 33810, "total_steps": 33920, "loss": 0.3078, "lr": 3.262002453047197e-10, "epoch": 19.93514150943396, "percentage": 99.68, "elapsed_time": "1:05:07", "remaining_time": "0:00:12", "throughput": 5648.75, "total_tokens": 22070312} {"current_steps": 33815, "total_steps": 33920, "loss": 0.4239, "lr": 2.974749992512571e-10, "epoch": 19.93808962264151, "percentage": 99.69, "elapsed_time": "1:05:07", "remaining_time": "0:00:12", "throughput": 5648.74, "total_tokens": 22073608} {"current_steps": 33820, "total_steps": 33920, "loss": 0.2968, "lr": 2.700734459881726e-10, "epoch": 19.941037735849058, "percentage": 99.71, "elapsed_time": "1:05:08", "remaining_time": "0:00:11", "throughput": 5648.66, "total_tokens": 22076264} {"current_steps": 33825, "total_steps": 33920, "loss": 0.3224, "lr": 2.439955927713289e-10, "epoch": 19.943985849056602, "percentage": 99.72, "elapsed_time": "1:05:08", "remaining_time": "0:00:10", "throughput": 5648.63, "total_tokens": 22079624} {"current_steps": 33830, "total_steps": 33920, "loss": 0.3369, "lr": 2.1924144650409263e-10, "epoch": 19.94693396226415, "percentage": 99.73, "elapsed_time": "1:05:09", "remaining_time": "0:00:10", "throughput": 5648.84, "total_tokens": 22084136} {"current_steps": 33835, "total_steps": 33920, "loss": 0.3427, "lr": 1.9581101374066546e-10, "epoch": 19.9498820754717, "percentage": 99.75, "elapsed_time": "1:05:10", "remaining_time": "0:00:09", "throughput": 5648.82, "total_tokens": 22086984} {"current_steps": 33840, "total_steps": 33920, "loss": 0.3402, "lr": 1.7370430068441858e-10, "epoch": 19.952830188679247, "percentage": 99.76, "elapsed_time": "1:05:10", "remaining_time": "0:00:09", "throughput": 5648.95, "total_tokens": 22090760} {"current_steps": 33845, "total_steps": 33920, "loss": 0.2809, "lr": 1.529213131878926e-10, "epoch": 19.95577830188679, "percentage": 99.78, "elapsed_time": "1:05:11", "remaining_time": "0:00:08", "throughput": 5648.92, "total_tokens": 22093544} {"current_steps": 33850, "total_steps": 33920, "loss": 0.2686, "lr": 1.3346205675335288e-10, "epoch": 19.95872641509434, "percentage": 99.79, "elapsed_time": "1:05:11", "remaining_time": "0:00:08", "throughput": 5649.03, "total_tokens": 22097032} {"current_steps": 33855, "total_steps": 33920, "loss": 0.2918, "lr": 1.1532653653334447e-10, "epoch": 19.961674528301888, "percentage": 99.81, "elapsed_time": "1:05:12", "remaining_time": "0:00:07", "throughput": 5649.15, "total_tokens": 22100904} {"current_steps": 33860, "total_steps": 33920, "loss": 0.2894, "lr": 9.85147573284717e-11, "epoch": 19.964622641509433, "percentage": 99.82, "elapsed_time": "1:05:12", "remaining_time": "0:00:06", "throughput": 5649.2, "total_tokens": 22104136} {"current_steps": 33865, "total_steps": 33920, "loss": 0.3854, "lr": 8.302672359072894e-11, "epoch": 19.96757075471698, "percentage": 99.84, "elapsed_time": "1:05:13", "remaining_time": "0:00:06", "throughput": 5649.26, "total_tokens": 22107496} {"current_steps": 33870, "total_steps": 33920, "loss": 0.339, "lr": 6.886243941961468e-11, "epoch": 19.97051886792453, "percentage": 99.85, "elapsed_time": "1:05:13", "remaining_time": "0:00:05", "throughput": 5649.17, "total_tokens": 22109960} {"current_steps": 33875, "total_steps": 33920, "loss": 0.2939, "lr": 5.602190856601741e-11, "epoch": 19.973466981132077, "percentage": 99.87, "elapsed_time": "1:05:14", "remaining_time": "0:00:05", "throughput": 5649.15, "total_tokens": 22113384} {"current_steps": 33880, "total_steps": 33920, "loss": 0.2258, "lr": 4.450513442888493e-11, "epoch": 19.97641509433962, "percentage": 99.88, "elapsed_time": "1:05:14", "remaining_time": "0:00:04", "throughput": 5649.14, "total_tokens": 22116328} {"current_steps": 33885, "total_steps": 33920, "loss": 0.249, "lr": 3.4312120057999886e-11, "epoch": 19.97936320754717, "percentage": 99.9, "elapsed_time": "1:05:15", "remaining_time": "0:00:04", "throughput": 5649.14, "total_tokens": 22119368} {"current_steps": 33890, "total_steps": 33920, "loss": 0.2913, "lr": 2.5442868151204224e-11, "epoch": 19.982311320754718, "percentage": 99.91, "elapsed_time": "1:05:16", "remaining_time": "0:00:03", "throughput": 5649.05, "total_tokens": 22121960} {"current_steps": 33895, "total_steps": 33920, "loss": 0.4277, "lr": 1.7897381057729867e-11, "epoch": 19.985259433962263, "percentage": 99.93, "elapsed_time": "1:05:16", "remaining_time": "0:00:02", "throughput": 5649.07, "total_tokens": 22124904} {"current_steps": 33900, "total_steps": 33920, "loss": 0.2248, "lr": 1.1675660773757813e-11, "epoch": 19.98820754716981, "percentage": 99.94, "elapsed_time": "1:05:17", "remaining_time": "0:00:02", "throughput": 5649.11, "total_tokens": 22127944} {"current_steps": 33905, "total_steps": 33920, "loss": 0.2733, "lr": 6.777708947969253e-12, "epoch": 19.99115566037736, "percentage": 99.96, "elapsed_time": "1:05:17", "remaining_time": "0:00:01", "throughput": 5649.04, "total_tokens": 22130952} {"current_steps": 33910, "total_steps": 33920, "loss": 0.2144, "lr": 3.2035268765495674e-12, "epoch": 19.994103773584907, "percentage": 99.97, "elapsed_time": "1:05:18", "remaining_time": "0:00:01", "throughput": 5648.9, "total_tokens": 22133416} {"current_steps": 33915, "total_steps": 33920, "loss": 0.3743, "lr": 9.531155059638863e-13, "epoch": 19.997051886792452, "percentage": 99.99, "elapsed_time": "1:05:18", "remaining_time": "0:00:00", "throughput": 5648.95, "total_tokens": 22136744} {"current_steps": 33920, "total_steps": 33920, "loss": 0.2493, "lr": 2.6475431291750342e-14, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "1:05:19", "remaining_time": "0:00:00", "throughput": 5648.67, "total_tokens": 22139032} {"current_steps": 33920, "total_steps": 33920, "eval_loss": 0.6312955617904663, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "1:05:38", "remaining_time": "0:00:00", "throughput": 5620.89, "total_tokens": 22139032} {"current_steps": 33920, "total_steps": 33920, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "1:05:41", "remaining_time": "0:00:00", "throughput": 5616.41, "total_tokens": 22139032}