diff --git "a/trainer_log.jsonl" "b/trainer_log.jsonl" --- "a/trainer_log.jsonl" +++ "b/trainer_log.jsonl" @@ -21497,3 +21497,2387 @@ {"current_steps": 107440, "total_steps": 119360, "loss": 0.4047, "lr": 3.0078717503978504e-07, "epoch": 18.00268096514745, "percentage": 90.01, "elapsed_time": "4:14:56", "remaining_time": "0:28:17", "throughput": 4071.49, "total_tokens": 62278896} {"current_steps": 107445, "total_steps": 119360, "loss": 0.2683, "lr": 3.0053746897438895e-07, "epoch": 18.00351876675603, "percentage": 90.02, "elapsed_time": "4:14:56", "remaining_time": "0:28:16", "throughput": 4071.5, "total_tokens": 62281744} {"current_steps": 107450, "total_steps": 119360, "loss": 0.3649, "lr": 3.0028786339030503e-07, "epoch": 18.00435656836461, "percentage": 90.02, "elapsed_time": "4:14:57", "remaining_time": "0:28:15", "throughput": 4071.52, "total_tokens": 62284592} +{"current_steps": 107455, "total_steps": 119360, "loss": 0.2515, "lr": 3.0003835829287287e-07, "epoch": 18.00519436997319, "percentage": 90.03, "elapsed_time": "4:14:58", "remaining_time": "0:28:14", "throughput": 4071.53, "total_tokens": 62288176} +{"current_steps": 107460, "total_steps": 119360, "loss": 0.4803, "lr": 2.997889536874271e-07, "epoch": 18.00603217158177, "percentage": 90.03, "elapsed_time": "4:14:59", "remaining_time": "0:28:14", "throughput": 4071.55, "total_tokens": 62291280} +{"current_steps": 107465, "total_steps": 119360, "loss": 0.5013, "lr": 2.9953964957929906e-07, "epoch": 18.006869973190348, "percentage": 90.03, "elapsed_time": "4:14:59", "remaining_time": "0:28:13", "throughput": 4071.56, "total_tokens": 62294000} +{"current_steps": 107470, "total_steps": 119360, "loss": 0.4264, "lr": 2.9929044597381827e-07, "epoch": 18.007707774798927, "percentage": 90.04, "elapsed_time": "4:15:00", "remaining_time": "0:28:12", "throughput": 4071.56, "total_tokens": 62296624} +{"current_steps": 107475, "total_steps": 119360, "loss": 0.2572, "lr": 2.990413428763167e-07, "epoch": 18.008545576407506, "percentage": 90.04, "elapsed_time": "4:15:01", "remaining_time": "0:28:12", "throughput": 4071.57, "total_tokens": 62299600} +{"current_steps": 107480, "total_steps": 119360, "loss": 0.3764, "lr": 2.987923402921178e-07, "epoch": 18.009383378016086, "percentage": 90.05, "elapsed_time": "4:15:01", "remaining_time": "0:28:11", "throughput": 4071.58, "total_tokens": 62302832} +{"current_steps": 107485, "total_steps": 119360, "loss": 0.2422, "lr": 2.9854343822654563e-07, "epoch": 18.010221179624665, "percentage": 90.05, "elapsed_time": "4:15:02", "remaining_time": "0:28:10", "throughput": 4071.6, "total_tokens": 62305744} +{"current_steps": 107490, "total_steps": 119360, "loss": 0.2792, "lr": 2.982946366849232e-07, "epoch": 18.011058981233244, "percentage": 90.06, "elapsed_time": "4:15:03", "remaining_time": "0:28:09", "throughput": 4071.6, "total_tokens": 62308400} +{"current_steps": 107495, "total_steps": 119360, "loss": 0.3678, "lr": 2.9804593567256954e-07, "epoch": 18.011896782841823, "percentage": 90.06, "elapsed_time": "4:15:03", "remaining_time": "0:28:09", "throughput": 4071.61, "total_tokens": 62311152} +{"current_steps": 107500, "total_steps": 119360, "loss": 0.297, "lr": 2.977973351948021e-07, "epoch": 18.012734584450403, "percentage": 90.06, "elapsed_time": "4:15:04", "remaining_time": "0:28:08", "throughput": 4071.62, "total_tokens": 62314224} +{"current_steps": 107505, "total_steps": 119360, "loss": 0.2737, "lr": 2.975488352569378e-07, "epoch": 18.013572386058982, "percentage": 90.07, "elapsed_time": "4:15:05", "remaining_time": "0:28:07", "throughput": 4071.63, "total_tokens": 62317104} +{"current_steps": 107510, "total_steps": 119360, "loss": 0.3044, "lr": 2.9730043586428726e-07, "epoch": 18.01441018766756, "percentage": 90.07, "elapsed_time": "4:15:05", "remaining_time": "0:28:07", "throughput": 4071.65, "total_tokens": 62320336} +{"current_steps": 107515, "total_steps": 119360, "loss": 0.3493, "lr": 2.970521370221635e-07, "epoch": 18.01524798927614, "percentage": 90.08, "elapsed_time": "4:15:06", "remaining_time": "0:28:06", "throughput": 4071.66, "total_tokens": 62323184} +{"current_steps": 107520, "total_steps": 119360, "loss": 0.4175, "lr": 2.9680393873587623e-07, "epoch": 18.01608579088472, "percentage": 90.08, "elapsed_time": "4:15:07", "remaining_time": "0:28:05", "throughput": 4071.66, "total_tokens": 62325808} +{"current_steps": 107525, "total_steps": 119360, "loss": 0.1769, "lr": 2.9655584101073054e-07, "epoch": 18.0169235924933, "percentage": 90.08, "elapsed_time": "4:15:07", "remaining_time": "0:28:04", "throughput": 4071.67, "total_tokens": 62328656} +{"current_steps": 107530, "total_steps": 119360, "loss": 0.2531, "lr": 2.963078438520306e-07, "epoch": 18.01776139410188, "percentage": 90.09, "elapsed_time": "4:15:08", "remaining_time": "0:28:04", "throughput": 4071.67, "total_tokens": 62331408} +{"current_steps": 107535, "total_steps": 119360, "loss": 0.6512, "lr": 2.960599472650816e-07, "epoch": 18.018599195710454, "percentage": 90.09, "elapsed_time": "4:15:09", "remaining_time": "0:28:03", "throughput": 4071.68, "total_tokens": 62334096} +{"current_steps": 107540, "total_steps": 119360, "loss": 0.2666, "lr": 2.9581215125518204e-07, "epoch": 18.019436997319033, "percentage": 90.1, "elapsed_time": "4:15:09", "remaining_time": "0:28:02", "throughput": 4071.69, "total_tokens": 62337264} +{"current_steps": 107545, "total_steps": 119360, "loss": 0.3321, "lr": 2.955644558276305e-07, "epoch": 18.020274798927613, "percentage": 90.1, "elapsed_time": "4:15:10", "remaining_time": "0:28:02", "throughput": 4071.71, "total_tokens": 62340240} +{"current_steps": 107550, "total_steps": 119360, "loss": 0.2162, "lr": 2.953168609877227e-07, "epoch": 18.021112600536192, "percentage": 90.11, "elapsed_time": "4:15:11", "remaining_time": "0:28:01", "throughput": 4071.72, "total_tokens": 62343120} +{"current_steps": 107555, "total_steps": 119360, "loss": 0.3879, "lr": 2.950693667407534e-07, "epoch": 18.02195040214477, "percentage": 90.11, "elapsed_time": "4:15:11", "remaining_time": "0:28:00", "throughput": 4071.73, "total_tokens": 62346160} +{"current_steps": 107560, "total_steps": 119360, "loss": 0.255, "lr": 2.9482197309201377e-07, "epoch": 18.02278820375335, "percentage": 90.11, "elapsed_time": "4:15:12", "remaining_time": "0:27:59", "throughput": 4071.73, "total_tokens": 62348944} +{"current_steps": 107565, "total_steps": 119360, "loss": 0.2423, "lr": 2.9457468004679466e-07, "epoch": 18.02362600536193, "percentage": 90.12, "elapsed_time": "4:15:13", "remaining_time": "0:27:59", "throughput": 4071.75, "total_tokens": 62352080} +{"current_steps": 107570, "total_steps": 119360, "loss": 0.2901, "lr": 2.943274876103813e-07, "epoch": 18.02446380697051, "percentage": 90.12, "elapsed_time": "4:15:14", "remaining_time": "0:27:58", "throughput": 4071.76, "total_tokens": 62355216} +{"current_steps": 107575, "total_steps": 119360, "loss": 0.1701, "lr": 2.9408039578806e-07, "epoch": 18.02530160857909, "percentage": 90.13, "elapsed_time": "4:15:14", "remaining_time": "0:27:57", "throughput": 4071.77, "total_tokens": 62357968} +{"current_steps": 107580, "total_steps": 119360, "loss": 0.2722, "lr": 2.938334045851154e-07, "epoch": 18.026139410187668, "percentage": 90.13, "elapsed_time": "4:15:15", "remaining_time": "0:27:57", "throughput": 4071.77, "total_tokens": 62360720} +{"current_steps": 107585, "total_steps": 119360, "loss": 0.3217, "lr": 2.935865140068273e-07, "epoch": 18.026977211796247, "percentage": 90.13, "elapsed_time": "4:15:16", "remaining_time": "0:27:56", "throughput": 4071.78, "total_tokens": 62363472} +{"current_steps": 107590, "total_steps": 119360, "loss": 0.4197, "lr": 2.93339724058474e-07, "epoch": 18.027815013404826, "percentage": 90.14, "elapsed_time": "4:15:16", "remaining_time": "0:27:55", "throughput": 4071.78, "total_tokens": 62366160} +{"current_steps": 107595, "total_steps": 119360, "loss": 0.5563, "lr": 2.930930347453326e-07, "epoch": 18.028652815013405, "percentage": 90.14, "elapsed_time": "4:15:17", "remaining_time": "0:27:54", "throughput": 4071.8, "total_tokens": 62369200} +{"current_steps": 107600, "total_steps": 119360, "loss": 0.2535, "lr": 2.928464460726782e-07, "epoch": 18.029490616621985, "percentage": 90.15, "elapsed_time": "4:15:18", "remaining_time": "0:27:54", "throughput": 4071.81, "total_tokens": 62372144} +{"current_steps": 107605, "total_steps": 119360, "loss": 0.4782, "lr": 2.925999580457833e-07, "epoch": 18.030328418230564, "percentage": 90.15, "elapsed_time": "4:15:18", "remaining_time": "0:27:53", "throughput": 4071.83, "total_tokens": 62375216} +{"current_steps": 107610, "total_steps": 119360, "loss": 0.2325, "lr": 2.923535706699182e-07, "epoch": 18.031166219839143, "percentage": 90.16, "elapsed_time": "4:15:19", "remaining_time": "0:27:52", "throughput": 4071.84, "total_tokens": 62378064} +{"current_steps": 107615, "total_steps": 119360, "loss": 0.1817, "lr": 2.9210728395034913e-07, "epoch": 18.032004021447722, "percentage": 90.16, "elapsed_time": "4:15:20", "remaining_time": "0:27:52", "throughput": 4071.85, "total_tokens": 62381168} +{"current_steps": 107620, "total_steps": 119360, "loss": 0.2924, "lr": 2.9186109789234416e-07, "epoch": 18.0328418230563, "percentage": 90.16, "elapsed_time": "4:15:20", "remaining_time": "0:27:51", "throughput": 4071.86, "total_tokens": 62383856} +{"current_steps": 107625, "total_steps": 119360, "loss": 0.2326, "lr": 2.91615012501168e-07, "epoch": 18.03367962466488, "percentage": 90.17, "elapsed_time": "4:15:21", "remaining_time": "0:27:50", "throughput": 4071.86, "total_tokens": 62386576} +{"current_steps": 107630, "total_steps": 119360, "loss": 0.364, "lr": 2.913690277820791e-07, "epoch": 18.03451742627346, "percentage": 90.17, "elapsed_time": "4:15:22", "remaining_time": "0:27:49", "throughput": 4071.86, "total_tokens": 62389232} +{"current_steps": 107635, "total_steps": 119360, "loss": 0.4959, "lr": 2.9112314374033834e-07, "epoch": 18.035355227882036, "percentage": 90.18, "elapsed_time": "4:15:22", "remaining_time": "0:27:49", "throughput": 4071.87, "total_tokens": 62392144} +{"current_steps": 107640, "total_steps": 119360, "loss": 0.1363, "lr": 2.908773603812054e-07, "epoch": 18.036193029490615, "percentage": 90.18, "elapsed_time": "4:15:23", "remaining_time": "0:27:48", "throughput": 4071.89, "total_tokens": 62395408} +{"current_steps": 107645, "total_steps": 119360, "loss": 0.2466, "lr": 2.906316777099322e-07, "epoch": 18.037030831099194, "percentage": 90.19, "elapsed_time": "4:15:24", "remaining_time": "0:27:47", "throughput": 4071.9, "total_tokens": 62398416} +{"current_steps": 107650, "total_steps": 119360, "loss": 0.3352, "lr": 2.9038609573177333e-07, "epoch": 18.037868632707774, "percentage": 90.19, "elapsed_time": "4:15:24", "remaining_time": "0:27:47", "throughput": 4071.92, "total_tokens": 62401584} +{"current_steps": 107655, "total_steps": 119360, "loss": 0.4739, "lr": 2.9014061445197914e-07, "epoch": 18.038706434316353, "percentage": 90.19, "elapsed_time": "4:15:25", "remaining_time": "0:27:46", "throughput": 4071.94, "total_tokens": 62404880} +{"current_steps": 107660, "total_steps": 119360, "loss": 0.2883, "lr": 2.8989523387579876e-07, "epoch": 18.039544235924932, "percentage": 90.2, "elapsed_time": "4:15:26", "remaining_time": "0:27:45", "throughput": 4071.97, "total_tokens": 62408144} +{"current_steps": 107665, "total_steps": 119360, "loss": 0.3073, "lr": 2.8964995400847906e-07, "epoch": 18.04038203753351, "percentage": 90.2, "elapsed_time": "4:15:26", "remaining_time": "0:27:44", "throughput": 4071.97, "total_tokens": 62410704} +{"current_steps": 107670, "total_steps": 119360, "loss": 0.4513, "lr": 2.894047748552647e-07, "epoch": 18.04121983914209, "percentage": 90.21, "elapsed_time": "4:15:27", "remaining_time": "0:27:44", "throughput": 4071.98, "total_tokens": 62413776} +{"current_steps": 107675, "total_steps": 119360, "loss": 0.154, "lr": 2.8915969642139607e-07, "epoch": 18.04205764075067, "percentage": 90.21, "elapsed_time": "4:15:28", "remaining_time": "0:27:43", "throughput": 4071.99, "total_tokens": 62416560} +{"current_steps": 107680, "total_steps": 119360, "loss": 0.5176, "lr": 2.8891471871211497e-07, "epoch": 18.04289544235925, "percentage": 90.21, "elapsed_time": "4:15:28", "remaining_time": "0:27:42", "throughput": 4072.01, "total_tokens": 62419536} +{"current_steps": 107685, "total_steps": 119360, "loss": 0.2804, "lr": 2.8866984173266e-07, "epoch": 18.04373324396783, "percentage": 90.22, "elapsed_time": "4:15:29", "remaining_time": "0:27:42", "throughput": 4072.02, "total_tokens": 62422288} +{"current_steps": 107690, "total_steps": 119360, "loss": 0.26, "lr": 2.884250654882653e-07, "epoch": 18.044571045576408, "percentage": 90.22, "elapsed_time": "4:15:30", "remaining_time": "0:27:41", "throughput": 4072.02, "total_tokens": 62424880} +{"current_steps": 107695, "total_steps": 119360, "loss": 0.3862, "lr": 2.881803899841651e-07, "epoch": 18.045408847184987, "percentage": 90.23, "elapsed_time": "4:15:30", "remaining_time": "0:27:40", "throughput": 4072.03, "total_tokens": 62427536} +{"current_steps": 107700, "total_steps": 119360, "loss": 0.3927, "lr": 2.879358152255912e-07, "epoch": 18.046246648793566, "percentage": 90.23, "elapsed_time": "4:15:31", "remaining_time": "0:27:39", "throughput": 4072.05, "total_tokens": 62430992} +{"current_steps": 107705, "total_steps": 119360, "loss": 0.4789, "lr": 2.8769134121777286e-07, "epoch": 18.047084450402146, "percentage": 90.24, "elapsed_time": "4:15:32", "remaining_time": "0:27:39", "throughput": 4072.05, "total_tokens": 62433552} +{"current_steps": 107710, "total_steps": 119360, "loss": 0.2119, "lr": 2.8744696796593753e-07, "epoch": 18.047922252010725, "percentage": 90.24, "elapsed_time": "4:15:32", "remaining_time": "0:27:38", "throughput": 4072.06, "total_tokens": 62436368} +{"current_steps": 107715, "total_steps": 119360, "loss": 0.1107, "lr": 2.872026954753099e-07, "epoch": 18.048760053619304, "percentage": 90.24, "elapsed_time": "4:15:33", "remaining_time": "0:27:37", "throughput": 4072.06, "total_tokens": 62439152} +{"current_steps": 107720, "total_steps": 119360, "loss": 0.3668, "lr": 2.8695852375111246e-07, "epoch": 18.049597855227884, "percentage": 90.25, "elapsed_time": "4:15:34", "remaining_time": "0:27:36", "throughput": 4072.08, "total_tokens": 62442032} +{"current_steps": 107725, "total_steps": 119360, "loss": 0.3302, "lr": 2.8671445279856716e-07, "epoch": 18.050435656836463, "percentage": 90.25, "elapsed_time": "4:15:34", "remaining_time": "0:27:36", "throughput": 4072.09, "total_tokens": 62444880} +{"current_steps": 107730, "total_steps": 119360, "loss": 0.263, "lr": 2.86470482622892e-07, "epoch": 18.05127345844504, "percentage": 90.26, "elapsed_time": "4:15:35", "remaining_time": "0:27:35", "throughput": 4072.09, "total_tokens": 62447696} +{"current_steps": 107735, "total_steps": 119360, "loss": 0.3051, "lr": 2.862266132293029e-07, "epoch": 18.052111260053618, "percentage": 90.26, "elapsed_time": "4:15:36", "remaining_time": "0:27:34", "throughput": 4072.11, "total_tokens": 62450864} +{"current_steps": 107740, "total_steps": 119360, "loss": 0.1579, "lr": 2.85982844623014e-07, "epoch": 18.052949061662197, "percentage": 90.26, "elapsed_time": "4:15:36", "remaining_time": "0:27:34", "throughput": 4072.12, "total_tokens": 62453776} +{"current_steps": 107745, "total_steps": 119360, "loss": 0.4373, "lr": 2.8573917680923933e-07, "epoch": 18.053786863270776, "percentage": 90.27, "elapsed_time": "4:15:37", "remaining_time": "0:27:33", "throughput": 4072.13, "total_tokens": 62456752} +{"current_steps": 107750, "total_steps": 119360, "loss": 0.4339, "lr": 2.854956097931866e-07, "epoch": 18.054624664879356, "percentage": 90.27, "elapsed_time": "4:15:38", "remaining_time": "0:27:32", "throughput": 4072.15, "total_tokens": 62460144} +{"current_steps": 107755, "total_steps": 119360, "loss": 0.6346, "lr": 2.852521435800648e-07, "epoch": 18.055462466487935, "percentage": 90.28, "elapsed_time": "4:15:39", "remaining_time": "0:27:31", "throughput": 4072.15, "total_tokens": 62463120} +{"current_steps": 107760, "total_steps": 119360, "loss": 0.3153, "lr": 2.850087781750793e-07, "epoch": 18.056300268096514, "percentage": 90.28, "elapsed_time": "4:15:39", "remaining_time": "0:27:31", "throughput": 4072.16, "total_tokens": 62465872} +{"current_steps": 107765, "total_steps": 119360, "loss": 0.3317, "lr": 2.847655135834332e-07, "epoch": 18.057138069705093, "percentage": 90.29, "elapsed_time": "4:15:40", "remaining_time": "0:27:30", "throughput": 4072.18, "total_tokens": 62468912} +{"current_steps": 107770, "total_steps": 119360, "loss": 0.4613, "lr": 2.845223498103289e-07, "epoch": 18.057975871313673, "percentage": 90.29, "elapsed_time": "4:15:41", "remaining_time": "0:27:29", "throughput": 4072.19, "total_tokens": 62471888} +{"current_steps": 107775, "total_steps": 119360, "loss": 0.4046, "lr": 2.8427928686096506e-07, "epoch": 18.058813672922252, "percentage": 90.29, "elapsed_time": "4:15:41", "remaining_time": "0:27:29", "throughput": 4072.2, "total_tokens": 62474800} +{"current_steps": 107780, "total_steps": 119360, "loss": 0.3397, "lr": 2.8403632474053756e-07, "epoch": 18.05965147453083, "percentage": 90.3, "elapsed_time": "4:15:42", "remaining_time": "0:27:28", "throughput": 4072.21, "total_tokens": 62477648} +{"current_steps": 107785, "total_steps": 119360, "loss": 0.4459, "lr": 2.837934634542433e-07, "epoch": 18.06048927613941, "percentage": 90.3, "elapsed_time": "4:15:43", "remaining_time": "0:27:27", "throughput": 4072.23, "total_tokens": 62480560} +{"current_steps": 107790, "total_steps": 119360, "loss": 0.2579, "lr": 2.835507030072743e-07, "epoch": 18.06132707774799, "percentage": 90.31, "elapsed_time": "4:15:43", "remaining_time": "0:27:26", "throughput": 4072.24, "total_tokens": 62483600} +{"current_steps": 107795, "total_steps": 119360, "loss": 0.3146, "lr": 2.8330804340482077e-07, "epoch": 18.06216487935657, "percentage": 90.31, "elapsed_time": "4:15:44", "remaining_time": "0:27:26", "throughput": 4072.25, "total_tokens": 62486608} +{"current_steps": 107800, "total_steps": 119360, "loss": 0.224, "lr": 2.8306548465207083e-07, "epoch": 18.06300268096515, "percentage": 90.32, "elapsed_time": "4:15:45", "remaining_time": "0:27:25", "throughput": 4072.26, "total_tokens": 62489424} +{"current_steps": 107805, "total_steps": 119360, "loss": 0.3285, "lr": 2.828230267542109e-07, "epoch": 18.063840482573728, "percentage": 90.32, "elapsed_time": "4:15:45", "remaining_time": "0:27:24", "throughput": 4072.27, "total_tokens": 62492624} +{"current_steps": 107810, "total_steps": 119360, "loss": 0.5443, "lr": 2.8258066971642573e-07, "epoch": 18.064678284182307, "percentage": 90.32, "elapsed_time": "4:15:46", "remaining_time": "0:27:24", "throughput": 4072.28, "total_tokens": 62495600} +{"current_steps": 107815, "total_steps": 119360, "loss": 0.3059, "lr": 2.823384135438967e-07, "epoch": 18.065516085790886, "percentage": 90.33, "elapsed_time": "4:15:47", "remaining_time": "0:27:23", "throughput": 4072.29, "total_tokens": 62498544} +{"current_steps": 107820, "total_steps": 119360, "loss": 0.4477, "lr": 2.820962582418041e-07, "epoch": 18.066353887399465, "percentage": 90.33, "elapsed_time": "4:15:47", "remaining_time": "0:27:22", "throughput": 4072.3, "total_tokens": 62501392} +{"current_steps": 107825, "total_steps": 119360, "loss": 0.3579, "lr": 2.818542038153249e-07, "epoch": 18.067191689008045, "percentage": 90.34, "elapsed_time": "4:15:48", "remaining_time": "0:27:21", "throughput": 4072.31, "total_tokens": 62504304} +{"current_steps": 107830, "total_steps": 119360, "loss": 0.3879, "lr": 2.81612250269635e-07, "epoch": 18.06802949061662, "percentage": 90.34, "elapsed_time": "4:15:49", "remaining_time": "0:27:21", "throughput": 4072.32, "total_tokens": 62506992} +{"current_steps": 107835, "total_steps": 119360, "loss": 0.3516, "lr": 2.813703976099086e-07, "epoch": 18.0688672922252, "percentage": 90.34, "elapsed_time": "4:15:49", "remaining_time": "0:27:20", "throughput": 4072.32, "total_tokens": 62509616} +{"current_steps": 107840, "total_steps": 119360, "loss": 0.328, "lr": 2.811286458413137e-07, "epoch": 18.06970509383378, "percentage": 90.35, "elapsed_time": "4:15:50", "remaining_time": "0:27:19", "throughput": 4072.33, "total_tokens": 62512336} +{"current_steps": 107845, "total_steps": 119360, "loss": 0.3922, "lr": 2.808869949690229e-07, "epoch": 18.070542895442358, "percentage": 90.35, "elapsed_time": "4:15:51", "remaining_time": "0:27:19", "throughput": 4072.35, "total_tokens": 62515472} +{"current_steps": 107850, "total_steps": 119360, "loss": 0.4554, "lr": 2.8064544499820213e-07, "epoch": 18.071380697050937, "percentage": 90.36, "elapsed_time": "4:15:51", "remaining_time": "0:27:18", "throughput": 4072.36, "total_tokens": 62518256} +{"current_steps": 107855, "total_steps": 119360, "loss": 0.4551, "lr": 2.804039959340149e-07, "epoch": 18.072218498659517, "percentage": 90.36, "elapsed_time": "4:15:52", "remaining_time": "0:27:17", "throughput": 4072.36, "total_tokens": 62521072} +{"current_steps": 107860, "total_steps": 119360, "loss": 0.4331, "lr": 2.801626477816244e-07, "epoch": 18.073056300268096, "percentage": 90.37, "elapsed_time": "4:15:53", "remaining_time": "0:27:16", "throughput": 4072.37, "total_tokens": 62523856} +{"current_steps": 107865, "total_steps": 119360, "loss": 0.3147, "lr": 2.7992140054619086e-07, "epoch": 18.073894101876675, "percentage": 90.37, "elapsed_time": "4:15:53", "remaining_time": "0:27:16", "throughput": 4072.38, "total_tokens": 62526672} +{"current_steps": 107870, "total_steps": 119360, "loss": 0.1712, "lr": 2.796802542328725e-07, "epoch": 18.074731903485254, "percentage": 90.37, "elapsed_time": "4:15:54", "remaining_time": "0:27:15", "throughput": 4072.39, "total_tokens": 62529488} +{"current_steps": 107875, "total_steps": 119360, "loss": 0.3247, "lr": 2.7943920884682617e-07, "epoch": 18.075569705093834, "percentage": 90.38, "elapsed_time": "4:15:55", "remaining_time": "0:27:14", "throughput": 4072.4, "total_tokens": 62532208} +{"current_steps": 107880, "total_steps": 119360, "loss": 0.145, "lr": 2.791982643932045e-07, "epoch": 18.076407506702413, "percentage": 90.38, "elapsed_time": "4:15:55", "remaining_time": "0:27:14", "throughput": 4072.4, "total_tokens": 62535088} +{"current_steps": 107885, "total_steps": 119360, "loss": 0.155, "lr": 2.7895742087716e-07, "epoch": 18.077245308310992, "percentage": 90.39, "elapsed_time": "4:15:56", "remaining_time": "0:27:13", "throughput": 4072.42, "total_tokens": 62538032} +{"current_steps": 107890, "total_steps": 119360, "loss": 0.3674, "lr": 2.7871667830384254e-07, "epoch": 18.07808310991957, "percentage": 90.39, "elapsed_time": "4:15:57", "remaining_time": "0:27:12", "throughput": 4072.43, "total_tokens": 62541104} +{"current_steps": 107895, "total_steps": 119360, "loss": 0.1709, "lr": 2.784760366783995e-07, "epoch": 18.07892091152815, "percentage": 90.39, "elapsed_time": "4:15:57", "remaining_time": "0:27:11", "throughput": 4072.45, "total_tokens": 62544080} +{"current_steps": 107900, "total_steps": 119360, "loss": 0.3872, "lr": 2.782354960059741e-07, "epoch": 18.07975871313673, "percentage": 90.4, "elapsed_time": "4:15:58", "remaining_time": "0:27:11", "throughput": 4072.46, "total_tokens": 62547248} +{"current_steps": 107905, "total_steps": 119360, "loss": 0.3532, "lr": 2.7799505629171273e-07, "epoch": 18.08059651474531, "percentage": 90.4, "elapsed_time": "4:15:59", "remaining_time": "0:27:10", "throughput": 4072.47, "total_tokens": 62550032} +{"current_steps": 107910, "total_steps": 119360, "loss": 0.4092, "lr": 2.777547175407541e-07, "epoch": 18.08143431635389, "percentage": 90.41, "elapsed_time": "4:15:59", "remaining_time": "0:27:09", "throughput": 4072.48, "total_tokens": 62552944} +{"current_steps": 107915, "total_steps": 119360, "loss": 0.1596, "lr": 2.7751447975823795e-07, "epoch": 18.082272117962468, "percentage": 90.41, "elapsed_time": "4:16:00", "remaining_time": "0:27:09", "throughput": 4072.5, "total_tokens": 62556080} +{"current_steps": 107920, "total_steps": 119360, "loss": 0.312, "lr": 2.7727434294930023e-07, "epoch": 18.083109919571047, "percentage": 90.42, "elapsed_time": "4:16:01", "remaining_time": "0:27:08", "throughput": 4072.51, "total_tokens": 62558832} +{"current_steps": 107925, "total_steps": 119360, "loss": 0.4625, "lr": 2.770343071190756e-07, "epoch": 18.083947721179623, "percentage": 90.42, "elapsed_time": "4:16:01", "remaining_time": "0:27:07", "throughput": 4072.52, "total_tokens": 62561808} +{"current_steps": 107930, "total_steps": 119360, "loss": 0.5335, "lr": 2.7679437227269676e-07, "epoch": 18.084785522788202, "percentage": 90.42, "elapsed_time": "4:16:02", "remaining_time": "0:27:06", "throughput": 4072.53, "total_tokens": 62564720} +{"current_steps": 107935, "total_steps": 119360, "loss": 0.1228, "lr": 2.7655453841529345e-07, "epoch": 18.08562332439678, "percentage": 90.43, "elapsed_time": "4:16:03", "remaining_time": "0:27:06", "throughput": 4072.56, "total_tokens": 62567920} +{"current_steps": 107940, "total_steps": 119360, "loss": 0.218, "lr": 2.7631480555199483e-07, "epoch": 18.08646112600536, "percentage": 90.43, "elapsed_time": "4:16:03", "remaining_time": "0:27:05", "throughput": 4072.56, "total_tokens": 62570736} +{"current_steps": 107945, "total_steps": 119360, "loss": 0.1582, "lr": 2.7607517368792414e-07, "epoch": 18.08729892761394, "percentage": 90.44, "elapsed_time": "4:16:04", "remaining_time": "0:27:04", "throughput": 4072.58, "total_tokens": 62573808} +{"current_steps": 107950, "total_steps": 119360, "loss": 0.296, "lr": 2.758356428282083e-07, "epoch": 18.08813672922252, "percentage": 90.44, "elapsed_time": "4:16:05", "remaining_time": "0:27:04", "throughput": 4072.59, "total_tokens": 62576944} +{"current_steps": 107955, "total_steps": 119360, "loss": 0.1697, "lr": 2.755962129779666e-07, "epoch": 18.0889745308311, "percentage": 90.44, "elapsed_time": "4:16:06", "remaining_time": "0:27:03", "throughput": 4072.6, "total_tokens": 62580080} +{"current_steps": 107960, "total_steps": 119360, "loss": 0.3807, "lr": 2.7535688414231877e-07, "epoch": 18.089812332439678, "percentage": 90.45, "elapsed_time": "4:16:06", "remaining_time": "0:27:02", "throughput": 4072.61, "total_tokens": 62582896} +{"current_steps": 107965, "total_steps": 119360, "loss": 0.1641, "lr": 2.7511765632638245e-07, "epoch": 18.090650134048257, "percentage": 90.45, "elapsed_time": "4:16:07", "remaining_time": "0:27:01", "throughput": 4072.62, "total_tokens": 62585936} +{"current_steps": 107970, "total_steps": 119360, "loss": 0.1109, "lr": 2.748785295352724e-07, "epoch": 18.091487935656836, "percentage": 90.46, "elapsed_time": "4:16:08", "remaining_time": "0:27:01", "throughput": 4072.63, "total_tokens": 62588880} +{"current_steps": 107975, "total_steps": 119360, "loss": 0.4052, "lr": 2.746395037741012e-07, "epoch": 18.092325737265416, "percentage": 90.46, "elapsed_time": "4:16:08", "remaining_time": "0:27:00", "throughput": 4072.64, "total_tokens": 62591632} +{"current_steps": 107980, "total_steps": 119360, "loss": 0.3433, "lr": 2.7440057904798034e-07, "epoch": 18.093163538873995, "percentage": 90.47, "elapsed_time": "4:16:09", "remaining_time": "0:26:59", "throughput": 4072.65, "total_tokens": 62594480} +{"current_steps": 107985, "total_steps": 119360, "loss": 0.3491, "lr": 2.7416175536201794e-07, "epoch": 18.094001340482574, "percentage": 90.47, "elapsed_time": "4:16:10", "remaining_time": "0:26:59", "throughput": 4072.66, "total_tokens": 62597264} +{"current_steps": 107990, "total_steps": 119360, "loss": 0.3706, "lr": 2.739230327213199e-07, "epoch": 18.094839142091153, "percentage": 90.47, "elapsed_time": "4:16:10", "remaining_time": "0:26:58", "throughput": 4072.66, "total_tokens": 62600112} +{"current_steps": 107995, "total_steps": 119360, "loss": 0.2794, "lr": 2.7368441113099165e-07, "epoch": 18.095676943699733, "percentage": 90.48, "elapsed_time": "4:16:11", "remaining_time": "0:26:57", "throughput": 4072.68, "total_tokens": 62603280} +{"current_steps": 108000, "total_steps": 119360, "loss": 0.3444, "lr": 2.7344589059613514e-07, "epoch": 18.096514745308312, "percentage": 90.48, "elapsed_time": "4:16:12", "remaining_time": "0:26:56", "throughput": 4072.68, "total_tokens": 62606032} +{"current_steps": 108005, "total_steps": 119360, "loss": 0.3828, "lr": 2.73207471121848e-07, "epoch": 18.09735254691689, "percentage": 90.49, "elapsed_time": "4:16:12", "remaining_time": "0:26:56", "throughput": 4072.7, "total_tokens": 62609200} +{"current_steps": 108010, "total_steps": 119360, "loss": 0.25, "lr": 2.7296915271323164e-07, "epoch": 18.09819034852547, "percentage": 90.49, "elapsed_time": "4:16:13", "remaining_time": "0:26:55", "throughput": 4072.71, "total_tokens": 62612144} +{"current_steps": 108015, "total_steps": 119360, "loss": 0.2399, "lr": 2.727309353753788e-07, "epoch": 18.09902815013405, "percentage": 90.5, "elapsed_time": "4:16:14", "remaining_time": "0:26:54", "throughput": 4072.71, "total_tokens": 62614864} +{"current_steps": 108020, "total_steps": 119360, "loss": 0.3497, "lr": 2.724928191133841e-07, "epoch": 18.09986595174263, "percentage": 90.5, "elapsed_time": "4:16:14", "remaining_time": "0:26:54", "throughput": 4072.72, "total_tokens": 62617840} +{"current_steps": 108025, "total_steps": 119360, "loss": 0.145, "lr": 2.7225480393233803e-07, "epoch": 18.100703753351205, "percentage": 90.5, "elapsed_time": "4:16:15", "remaining_time": "0:26:53", "throughput": 4072.73, "total_tokens": 62620848} +{"current_steps": 108030, "total_steps": 119360, "loss": 0.4636, "lr": 2.720168898373304e-07, "epoch": 18.101541554959784, "percentage": 90.51, "elapsed_time": "4:16:16", "remaining_time": "0:26:52", "throughput": 4072.75, "total_tokens": 62623920} +{"current_steps": 108035, "total_steps": 119360, "loss": 0.0915, "lr": 2.717790768334483e-07, "epoch": 18.102379356568363, "percentage": 90.51, "elapsed_time": "4:16:16", "remaining_time": "0:26:51", "throughput": 4072.76, "total_tokens": 62626768} +{"current_steps": 108040, "total_steps": 119360, "loss": 0.2628, "lr": 2.7154136492577586e-07, "epoch": 18.103217158176943, "percentage": 90.52, "elapsed_time": "4:16:17", "remaining_time": "0:26:51", "throughput": 4072.77, "total_tokens": 62629648} +{"current_steps": 108045, "total_steps": 119360, "loss": 0.3756, "lr": 2.7130375411939635e-07, "epoch": 18.104054959785522, "percentage": 90.52, "elapsed_time": "4:16:18", "remaining_time": "0:26:50", "throughput": 4072.79, "total_tokens": 62632752} +{"current_steps": 108050, "total_steps": 119360, "loss": 0.4189, "lr": 2.7106624441938956e-07, "epoch": 18.1048927613941, "percentage": 90.52, "elapsed_time": "4:16:19", "remaining_time": "0:26:49", "throughput": 4072.79, "total_tokens": 62635504} +{"current_steps": 108055, "total_steps": 119360, "loss": 0.537, "lr": 2.708288358308353e-07, "epoch": 18.10573056300268, "percentage": 90.53, "elapsed_time": "4:16:19", "remaining_time": "0:26:49", "throughput": 4072.8, "total_tokens": 62638352} +{"current_steps": 108060, "total_steps": 119360, "loss": 0.6529, "lr": 2.7059152835880784e-07, "epoch": 18.10656836461126, "percentage": 90.53, "elapsed_time": "4:16:20", "remaining_time": "0:26:48", "throughput": 4072.81, "total_tokens": 62641328} +{"current_steps": 108065, "total_steps": 119360, "loss": 0.4511, "lr": 2.7035432200838096e-07, "epoch": 18.10740616621984, "percentage": 90.54, "elapsed_time": "4:16:21", "remaining_time": "0:26:47", "throughput": 4072.82, "total_tokens": 62644080} +{"current_steps": 108070, "total_steps": 119360, "loss": 0.0811, "lr": 2.7011721678462885e-07, "epoch": 18.108243967828418, "percentage": 90.54, "elapsed_time": "4:16:21", "remaining_time": "0:26:46", "throughput": 4072.83, "total_tokens": 62647024} +{"current_steps": 108075, "total_steps": 119360, "loss": 0.2731, "lr": 2.698802126926192e-07, "epoch": 18.109081769436997, "percentage": 90.55, "elapsed_time": "4:16:22", "remaining_time": "0:26:46", "throughput": 4072.85, "total_tokens": 62650064} +{"current_steps": 108080, "total_steps": 119360, "loss": 0.2478, "lr": 2.696433097374196e-07, "epoch": 18.109919571045577, "percentage": 90.55, "elapsed_time": "4:16:23", "remaining_time": "0:26:45", "throughput": 4072.85, "total_tokens": 62652784} +{"current_steps": 108085, "total_steps": 119360, "loss": 0.3356, "lr": 2.6940650792409596e-07, "epoch": 18.110757372654156, "percentage": 90.55, "elapsed_time": "4:16:23", "remaining_time": "0:26:44", "throughput": 4072.86, "total_tokens": 62655664} +{"current_steps": 108090, "total_steps": 119360, "loss": 0.6206, "lr": 2.691698072577115e-07, "epoch": 18.111595174262735, "percentage": 90.56, "elapsed_time": "4:16:24", "remaining_time": "0:26:44", "throughput": 4072.86, "total_tokens": 62658448} +{"current_steps": 108095, "total_steps": 119360, "loss": 0.2363, "lr": 2.689332077433271e-07, "epoch": 18.112432975871315, "percentage": 90.56, "elapsed_time": "4:16:25", "remaining_time": "0:26:43", "throughput": 4072.87, "total_tokens": 62661296} +{"current_steps": 108100, "total_steps": 119360, "loss": 0.2346, "lr": 2.68696709386001e-07, "epoch": 18.113270777479894, "percentage": 90.57, "elapsed_time": "4:16:25", "remaining_time": "0:26:42", "throughput": 4072.88, "total_tokens": 62664144} +{"current_steps": 108105, "total_steps": 119360, "loss": 0.2387, "lr": 2.684603121907914e-07, "epoch": 18.114108579088473, "percentage": 90.57, "elapsed_time": "4:16:26", "remaining_time": "0:26:41", "throughput": 4072.89, "total_tokens": 62666992} +{"current_steps": 108110, "total_steps": 119360, "loss": 0.3778, "lr": 2.682240161627503e-07, "epoch": 18.114946380697052, "percentage": 90.57, "elapsed_time": "4:16:27", "remaining_time": "0:26:41", "throughput": 4072.9, "total_tokens": 62670128} +{"current_steps": 108115, "total_steps": 119360, "loss": 0.1339, "lr": 2.679878213069331e-07, "epoch": 18.11578418230563, "percentage": 90.58, "elapsed_time": "4:16:27", "remaining_time": "0:26:40", "throughput": 4072.91, "total_tokens": 62673040} +{"current_steps": 108120, "total_steps": 119360, "loss": 0.2481, "lr": 2.677517276283875e-07, "epoch": 18.11662198391421, "percentage": 90.58, "elapsed_time": "4:16:28", "remaining_time": "0:26:39", "throughput": 4072.92, "total_tokens": 62676368} +{"current_steps": 108125, "total_steps": 119360, "loss": 0.2326, "lr": 2.675157351321628e-07, "epoch": 18.117459785522787, "percentage": 90.59, "elapsed_time": "4:16:29", "remaining_time": "0:26:39", "throughput": 4072.93, "total_tokens": 62679504} +{"current_steps": 108130, "total_steps": 119360, "loss": 0.3046, "lr": 2.672798438233043e-07, "epoch": 18.118297587131366, "percentage": 90.59, "elapsed_time": "4:16:29", "remaining_time": "0:26:38", "throughput": 4072.95, "total_tokens": 62682480} +{"current_steps": 108135, "total_steps": 119360, "loss": 0.3182, "lr": 2.670440537068564e-07, "epoch": 18.119135388739945, "percentage": 90.6, "elapsed_time": "4:16:30", "remaining_time": "0:26:37", "throughput": 4072.96, "total_tokens": 62685264} +{"current_steps": 108140, "total_steps": 119360, "loss": 0.4143, "lr": 2.668083647878594e-07, "epoch": 18.119973190348524, "percentage": 90.6, "elapsed_time": "4:16:31", "remaining_time": "0:26:36", "throughput": 4072.98, "total_tokens": 62688720} +{"current_steps": 108145, "total_steps": 119360, "loss": 0.2404, "lr": 2.665727770713539e-07, "epoch": 18.120810991957104, "percentage": 90.6, "elapsed_time": "4:16:32", "remaining_time": "0:26:36", "throughput": 4072.98, "total_tokens": 62691376} +{"current_steps": 108150, "total_steps": 119360, "loss": 0.2499, "lr": 2.6633729056237625e-07, "epoch": 18.121648793565683, "percentage": 90.61, "elapsed_time": "4:16:32", "remaining_time": "0:26:35", "throughput": 4072.99, "total_tokens": 62694288} +{"current_steps": 108155, "total_steps": 119360, "loss": 0.4467, "lr": 2.661019052659625e-07, "epoch": 18.122486595174262, "percentage": 90.61, "elapsed_time": "4:16:33", "remaining_time": "0:26:34", "throughput": 4073.01, "total_tokens": 62697424} +{"current_steps": 108160, "total_steps": 119360, "loss": 0.6459, "lr": 2.658666211871452e-07, "epoch": 18.12332439678284, "percentage": 90.62, "elapsed_time": "4:16:34", "remaining_time": "0:26:34", "throughput": 4073.03, "total_tokens": 62700560} +{"current_steps": 108165, "total_steps": 119360, "loss": 0.233, "lr": 2.6563143833095383e-07, "epoch": 18.12416219839142, "percentage": 90.62, "elapsed_time": "4:16:34", "remaining_time": "0:26:33", "throughput": 4073.04, "total_tokens": 62703504} +{"current_steps": 108170, "total_steps": 119360, "loss": 0.513, "lr": 2.653963567024176e-07, "epoch": 18.125, "percentage": 90.62, "elapsed_time": "4:16:35", "remaining_time": "0:26:32", "throughput": 4073.06, "total_tokens": 62706480} +{"current_steps": 108175, "total_steps": 119360, "loss": 0.3317, "lr": 2.6516137630656414e-07, "epoch": 18.12583780160858, "percentage": 90.63, "elapsed_time": "4:16:36", "remaining_time": "0:26:31", "throughput": 4073.06, "total_tokens": 62709264} +{"current_steps": 108180, "total_steps": 119360, "loss": 0.4919, "lr": 2.6492649714841667e-07, "epoch": 18.12667560321716, "percentage": 90.63, "elapsed_time": "4:16:36", "remaining_time": "0:26:31", "throughput": 4073.08, "total_tokens": 62712208} +{"current_steps": 108185, "total_steps": 119360, "loss": 0.1631, "lr": 2.6469171923299675e-07, "epoch": 18.127513404825738, "percentage": 90.64, "elapsed_time": "4:16:37", "remaining_time": "0:26:30", "throughput": 4073.09, "total_tokens": 62715184} +{"current_steps": 108190, "total_steps": 119360, "loss": 0.4362, "lr": 2.6445704256532476e-07, "epoch": 18.128351206434317, "percentage": 90.64, "elapsed_time": "4:16:38", "remaining_time": "0:26:29", "throughput": 4073.09, "total_tokens": 62717936} +{"current_steps": 108195, "total_steps": 119360, "loss": 0.2198, "lr": 2.64222467150419e-07, "epoch": 18.129189008042896, "percentage": 90.65, "elapsed_time": "4:16:38", "remaining_time": "0:26:29", "throughput": 4073.1, "total_tokens": 62720816} +{"current_steps": 108200, "total_steps": 119360, "loss": 0.2851, "lr": 2.6398799299329425e-07, "epoch": 18.130026809651476, "percentage": 90.65, "elapsed_time": "4:16:39", "remaining_time": "0:26:28", "throughput": 4073.11, "total_tokens": 62723920} +{"current_steps": 108205, "total_steps": 119360, "loss": 0.4179, "lr": 2.6375362009896433e-07, "epoch": 18.130864611260055, "percentage": 90.65, "elapsed_time": "4:16:40", "remaining_time": "0:26:27", "throughput": 4073.13, "total_tokens": 62726832} +{"current_steps": 108210, "total_steps": 119360, "loss": 0.3948, "lr": 2.6351934847243965e-07, "epoch": 18.131702412868634, "percentage": 90.66, "elapsed_time": "4:16:40", "remaining_time": "0:26:26", "throughput": 4073.14, "total_tokens": 62730000} +{"current_steps": 108215, "total_steps": 119360, "loss": 0.4761, "lr": 2.632851781187301e-07, "epoch": 18.132540214477213, "percentage": 90.66, "elapsed_time": "4:16:41", "remaining_time": "0:26:26", "throughput": 4073.15, "total_tokens": 62732816} +{"current_steps": 108220, "total_steps": 119360, "loss": 0.3315, "lr": 2.6305110904284337e-07, "epoch": 18.13337801608579, "percentage": 90.67, "elapsed_time": "4:16:42", "remaining_time": "0:26:25", "throughput": 4073.17, "total_tokens": 62735984} +{"current_steps": 108225, "total_steps": 119360, "loss": 0.3417, "lr": 2.6281714124978263e-07, "epoch": 18.13421581769437, "percentage": 90.67, "elapsed_time": "4:16:42", "remaining_time": "0:26:24", "throughput": 4073.18, "total_tokens": 62738800} +{"current_steps": 108230, "total_steps": 119360, "loss": 0.1973, "lr": 2.6258327474455004e-07, "epoch": 18.135053619302948, "percentage": 90.68, "elapsed_time": "4:16:43", "remaining_time": "0:26:24", "throughput": 4073.2, "total_tokens": 62742160} +{"current_steps": 108235, "total_steps": 119360, "loss": 0.3735, "lr": 2.6234950953214875e-07, "epoch": 18.135891420911527, "percentage": 90.68, "elapsed_time": "4:16:44", "remaining_time": "0:26:23", "throughput": 4073.21, "total_tokens": 62745200} +{"current_steps": 108240, "total_steps": 119360, "loss": 0.3083, "lr": 2.621158456175743e-07, "epoch": 18.136729222520106, "percentage": 90.68, "elapsed_time": "4:16:45", "remaining_time": "0:26:22", "throughput": 4073.22, "total_tokens": 62748048} +{"current_steps": 108245, "total_steps": 119360, "loss": 0.4541, "lr": 2.6188228300582376e-07, "epoch": 18.137567024128685, "percentage": 90.69, "elapsed_time": "4:16:45", "remaining_time": "0:26:21", "throughput": 4073.22, "total_tokens": 62750800} +{"current_steps": 108250, "total_steps": 119360, "loss": 0.2184, "lr": 2.6164882170189144e-07, "epoch": 18.138404825737265, "percentage": 90.69, "elapsed_time": "4:16:46", "remaining_time": "0:26:21", "throughput": 4073.23, "total_tokens": 62753776} +{"current_steps": 108255, "total_steps": 119360, "loss": 0.2242, "lr": 2.614154617107684e-07, "epoch": 18.139242627345844, "percentage": 90.7, "elapsed_time": "4:16:47", "remaining_time": "0:26:20", "throughput": 4073.25, "total_tokens": 62756880} +{"current_steps": 108260, "total_steps": 119360, "loss": 0.4377, "lr": 2.611822030374439e-07, "epoch": 18.140080428954423, "percentage": 90.7, "elapsed_time": "4:16:47", "remaining_time": "0:26:19", "throughput": 4073.27, "total_tokens": 62760016} +{"current_steps": 108265, "total_steps": 119360, "loss": 0.2666, "lr": 2.609490456869074e-07, "epoch": 18.140918230563003, "percentage": 90.7, "elapsed_time": "4:16:48", "remaining_time": "0:26:19", "throughput": 4073.29, "total_tokens": 62763216} +{"current_steps": 108270, "total_steps": 119360, "loss": 0.3595, "lr": 2.6071598966414146e-07, "epoch": 18.141756032171582, "percentage": 90.71, "elapsed_time": "4:16:49", "remaining_time": "0:26:18", "throughput": 4073.29, "total_tokens": 62765936} +{"current_steps": 108275, "total_steps": 119360, "loss": 0.3353, "lr": 2.6048303497413e-07, "epoch": 18.14259383378016, "percentage": 90.71, "elapsed_time": "4:16:49", "remaining_time": "0:26:17", "throughput": 4073.3, "total_tokens": 62768624} +{"current_steps": 108280, "total_steps": 119360, "loss": 0.2583, "lr": 2.602501816218556e-07, "epoch": 18.14343163538874, "percentage": 90.72, "elapsed_time": "4:16:50", "remaining_time": "0:26:16", "throughput": 4073.31, "total_tokens": 62771440} +{"current_steps": 108285, "total_steps": 119360, "loss": 0.4499, "lr": 2.600174296122948e-07, "epoch": 18.14426943699732, "percentage": 90.72, "elapsed_time": "4:16:51", "remaining_time": "0:26:16", "throughput": 4073.32, "total_tokens": 62774288} +{"current_steps": 108290, "total_steps": 119360, "loss": 0.2297, "lr": 2.5978477895042484e-07, "epoch": 18.1451072386059, "percentage": 90.73, "elapsed_time": "4:16:51", "remaining_time": "0:26:15", "throughput": 4073.33, "total_tokens": 62777136} +{"current_steps": 108295, "total_steps": 119360, "loss": 0.4209, "lr": 2.5955222964122115e-07, "epoch": 18.145945040214478, "percentage": 90.73, "elapsed_time": "4:16:52", "remaining_time": "0:26:14", "throughput": 4073.34, "total_tokens": 62780080} +{"current_steps": 108300, "total_steps": 119360, "loss": 0.4525, "lr": 2.593197816896542e-07, "epoch": 18.146782841823057, "percentage": 90.73, "elapsed_time": "4:16:53", "remaining_time": "0:26:14", "throughput": 4073.35, "total_tokens": 62782736} +{"current_steps": 108305, "total_steps": 119360, "loss": 0.354, "lr": 2.590874351006956e-07, "epoch": 18.147620643431637, "percentage": 90.74, "elapsed_time": "4:16:53", "remaining_time": "0:26:13", "throughput": 4073.36, "total_tokens": 62785520} +{"current_steps": 108310, "total_steps": 119360, "loss": 0.2825, "lr": 2.588551898793135e-07, "epoch": 18.148458445040216, "percentage": 90.74, "elapsed_time": "4:16:54", "remaining_time": "0:26:12", "throughput": 4073.37, "total_tokens": 62788432} +{"current_steps": 108315, "total_steps": 119360, "loss": 0.5162, "lr": 2.5862304603047117e-07, "epoch": 18.149296246648795, "percentage": 90.75, "elapsed_time": "4:16:55", "remaining_time": "0:26:11", "throughput": 4073.39, "total_tokens": 62791568} +{"current_steps": 108320, "total_steps": 119360, "loss": 0.2624, "lr": 2.583910035591347e-07, "epoch": 18.15013404825737, "percentage": 90.75, "elapsed_time": "4:16:55", "remaining_time": "0:26:11", "throughput": 4073.39, "total_tokens": 62794416} +{"current_steps": 108325, "total_steps": 119360, "loss": 0.6329, "lr": 2.5815906247026514e-07, "epoch": 18.15097184986595, "percentage": 90.75, "elapsed_time": "4:16:56", "remaining_time": "0:26:10", "throughput": 4073.4, "total_tokens": 62797200} +{"current_steps": 108330, "total_steps": 119360, "loss": 0.385, "lr": 2.5792722276882064e-07, "epoch": 18.15180965147453, "percentage": 90.76, "elapsed_time": "4:16:57", "remaining_time": "0:26:09", "throughput": 4073.42, "total_tokens": 62800432} +{"current_steps": 108335, "total_steps": 119360, "loss": 0.4238, "lr": 2.576954844597579e-07, "epoch": 18.15264745308311, "percentage": 90.76, "elapsed_time": "4:16:57", "remaining_time": "0:26:09", "throughput": 4073.43, "total_tokens": 62803248} +{"current_steps": 108340, "total_steps": 119360, "loss": 0.3085, "lr": 2.57463847548034e-07, "epoch": 18.153485254691688, "percentage": 90.77, "elapsed_time": "4:16:58", "remaining_time": "0:26:08", "throughput": 4073.43, "total_tokens": 62805904} +{"current_steps": 108345, "total_steps": 119360, "loss": 0.5044, "lr": 2.5723231203860057e-07, "epoch": 18.154323056300267, "percentage": 90.77, "elapsed_time": "4:16:59", "remaining_time": "0:26:07", "throughput": 4073.44, "total_tokens": 62808816} +{"current_steps": 108350, "total_steps": 119360, "loss": 0.4629, "lr": 2.570008779364075e-07, "epoch": 18.155160857908847, "percentage": 90.78, "elapsed_time": "4:16:59", "remaining_time": "0:26:06", "throughput": 4073.45, "total_tokens": 62811792} +{"current_steps": 108355, "total_steps": 119360, "loss": 0.4552, "lr": 2.567695452464036e-07, "epoch": 18.155998659517426, "percentage": 90.78, "elapsed_time": "4:17:00", "remaining_time": "0:26:06", "throughput": 4073.46, "total_tokens": 62814480} +{"current_steps": 108360, "total_steps": 119360, "loss": 0.2006, "lr": 2.565383139735356e-07, "epoch": 18.156836461126005, "percentage": 90.78, "elapsed_time": "4:17:01", "remaining_time": "0:26:05", "throughput": 4073.47, "total_tokens": 62817520} +{"current_steps": 108365, "total_steps": 119360, "loss": 0.4838, "lr": 2.5630718412274656e-07, "epoch": 18.157674262734584, "percentage": 90.79, "elapsed_time": "4:17:01", "remaining_time": "0:26:04", "throughput": 4073.48, "total_tokens": 62820368} +{"current_steps": 108370, "total_steps": 119360, "loss": 0.5845, "lr": 2.5607615569898046e-07, "epoch": 18.158512064343164, "percentage": 90.79, "elapsed_time": "4:17:02", "remaining_time": "0:26:04", "throughput": 4073.5, "total_tokens": 62823440} +{"current_steps": 108375, "total_steps": 119360, "loss": 0.3333, "lr": 2.558452287071733e-07, "epoch": 18.159349865951743, "percentage": 90.8, "elapsed_time": "4:17:03", "remaining_time": "0:26:03", "throughput": 4073.51, "total_tokens": 62826320} +{"current_steps": 108380, "total_steps": 119360, "loss": 0.4133, "lr": 2.5561440315226617e-07, "epoch": 18.160187667560322, "percentage": 90.8, "elapsed_time": "4:17:03", "remaining_time": "0:26:02", "throughput": 4073.52, "total_tokens": 62829200} +{"current_steps": 108385, "total_steps": 119360, "loss": 0.6349, "lr": 2.553836790391939e-07, "epoch": 18.1610254691689, "percentage": 90.81, "elapsed_time": "4:17:04", "remaining_time": "0:26:01", "throughput": 4073.53, "total_tokens": 62832080} +{"current_steps": 108390, "total_steps": 119360, "loss": 0.3768, "lr": 2.5515305637288823e-07, "epoch": 18.16186327077748, "percentage": 90.81, "elapsed_time": "4:17:05", "remaining_time": "0:26:01", "throughput": 4073.55, "total_tokens": 62835088} +{"current_steps": 108395, "total_steps": 119360, "loss": 0.3237, "lr": 2.549225351582801e-07, "epoch": 18.16270107238606, "percentage": 90.81, "elapsed_time": "4:17:05", "remaining_time": "0:26:00", "throughput": 4073.56, "total_tokens": 62838288} +{"current_steps": 108400, "total_steps": 119360, "loss": 0.4097, "lr": 2.546921154003007e-07, "epoch": 18.16353887399464, "percentage": 90.82, "elapsed_time": "4:17:06", "remaining_time": "0:25:59", "throughput": 4073.58, "total_tokens": 62841296} +{"current_steps": 108405, "total_steps": 119360, "loss": 0.3236, "lr": 2.5446179710387485e-07, "epoch": 18.16437667560322, "percentage": 90.82, "elapsed_time": "4:17:07", "remaining_time": "0:25:59", "throughput": 4073.59, "total_tokens": 62844144} +{"current_steps": 108410, "total_steps": 119360, "loss": 0.3982, "lr": 2.542315802739276e-07, "epoch": 18.165214477211798, "percentage": 90.83, "elapsed_time": "4:17:07", "remaining_time": "0:25:58", "throughput": 4073.6, "total_tokens": 62847248} +{"current_steps": 108415, "total_steps": 119360, "loss": 0.4991, "lr": 2.5400146491538045e-07, "epoch": 18.166052278820377, "percentage": 90.83, "elapsed_time": "4:17:08", "remaining_time": "0:25:57", "throughput": 4073.62, "total_tokens": 62850224} +{"current_steps": 108420, "total_steps": 119360, "loss": 0.3673, "lr": 2.5377145103315514e-07, "epoch": 18.166890080428953, "percentage": 90.83, "elapsed_time": "4:17:09", "remaining_time": "0:25:56", "throughput": 4073.63, "total_tokens": 62852912} +{"current_steps": 108425, "total_steps": 119360, "loss": 0.2708, "lr": 2.535415386321688e-07, "epoch": 18.167727882037532, "percentage": 90.84, "elapsed_time": "4:17:09", "remaining_time": "0:25:56", "throughput": 4073.63, "total_tokens": 62855632} +{"current_steps": 108430, "total_steps": 119360, "loss": 0.4235, "lr": 2.53311727717338e-07, "epoch": 18.16856568364611, "percentage": 90.84, "elapsed_time": "4:17:10", "remaining_time": "0:25:55", "throughput": 4073.64, "total_tokens": 62858544} +{"current_steps": 108435, "total_steps": 119360, "loss": 0.4307, "lr": 2.5308201829357506e-07, "epoch": 18.16940348525469, "percentage": 90.85, "elapsed_time": "4:17:11", "remaining_time": "0:25:54", "throughput": 4073.65, "total_tokens": 62861360} +{"current_steps": 108440, "total_steps": 119360, "loss": 0.5085, "lr": 2.52852410365792e-07, "epoch": 18.17024128686327, "percentage": 90.85, "elapsed_time": "4:17:11", "remaining_time": "0:25:54", "throughput": 4073.66, "total_tokens": 62864144} +{"current_steps": 108445, "total_steps": 119360, "loss": 0.3952, "lr": 2.5262290393889943e-07, "epoch": 18.17107908847185, "percentage": 90.86, "elapsed_time": "4:17:12", "remaining_time": "0:25:53", "throughput": 4073.66, "total_tokens": 62866768} +{"current_steps": 108450, "total_steps": 119360, "loss": 0.4809, "lr": 2.523934990178034e-07, "epoch": 18.17191689008043, "percentage": 90.86, "elapsed_time": "4:17:13", "remaining_time": "0:25:52", "throughput": 4073.67, "total_tokens": 62869776} +{"current_steps": 108455, "total_steps": 119360, "loss": 0.3544, "lr": 2.521641956074089e-07, "epoch": 18.172754691689008, "percentage": 90.86, "elapsed_time": "4:17:13", "remaining_time": "0:25:51", "throughput": 4073.67, "total_tokens": 62872464} +{"current_steps": 108460, "total_steps": 119360, "loss": 0.4571, "lr": 2.519349937126186e-07, "epoch": 18.173592493297587, "percentage": 90.87, "elapsed_time": "4:17:14", "remaining_time": "0:25:51", "throughput": 4073.69, "total_tokens": 62875600} +{"current_steps": 108465, "total_steps": 119360, "loss": 0.2342, "lr": 2.517058933383337e-07, "epoch": 18.174430294906166, "percentage": 90.87, "elapsed_time": "4:17:15", "remaining_time": "0:25:50", "throughput": 4073.71, "total_tokens": 62878800} +{"current_steps": 108470, "total_steps": 119360, "loss": 0.4211, "lr": 2.51476894489453e-07, "epoch": 18.175268096514746, "percentage": 90.88, "elapsed_time": "4:17:15", "remaining_time": "0:25:49", "throughput": 4073.72, "total_tokens": 62881616} +{"current_steps": 108475, "total_steps": 119360, "loss": 0.1491, "lr": 2.5124799717087256e-07, "epoch": 18.176105898123325, "percentage": 90.88, "elapsed_time": "4:17:16", "remaining_time": "0:25:48", "throughput": 4073.73, "total_tokens": 62884336} +{"current_steps": 108480, "total_steps": 119360, "loss": 0.3251, "lr": 2.5101920138748517e-07, "epoch": 18.176943699731904, "percentage": 90.88, "elapsed_time": "4:17:17", "remaining_time": "0:25:48", "throughput": 4073.74, "total_tokens": 62887056} +{"current_steps": 108485, "total_steps": 119360, "loss": 0.4191, "lr": 2.507905071441846e-07, "epoch": 18.177781501340483, "percentage": 90.89, "elapsed_time": "4:17:17", "remaining_time": "0:25:47", "throughput": 4073.75, "total_tokens": 62889904} +{"current_steps": 108490, "total_steps": 119360, "loss": 0.5473, "lr": 2.505619144458604e-07, "epoch": 18.178619302949063, "percentage": 90.89, "elapsed_time": "4:17:18", "remaining_time": "0:25:46", "throughput": 4073.75, "total_tokens": 62893040} +{"current_steps": 108495, "total_steps": 119360, "loss": 0.2758, "lr": 2.5033342329739975e-07, "epoch": 18.179457104557642, "percentage": 90.9, "elapsed_time": "4:17:19", "remaining_time": "0:25:46", "throughput": 4073.76, "total_tokens": 62895920} +{"current_steps": 108500, "total_steps": 119360, "loss": 0.3831, "lr": 2.5010503370368754e-07, "epoch": 18.18029490616622, "percentage": 90.9, "elapsed_time": "4:17:19", "remaining_time": "0:25:45", "throughput": 4073.78, "total_tokens": 62899120} +{"current_steps": 108505, "total_steps": 119360, "loss": 0.3998, "lr": 2.4987674566960883e-07, "epoch": 18.1811327077748, "percentage": 90.91, "elapsed_time": "4:17:20", "remaining_time": "0:25:44", "throughput": 4073.79, "total_tokens": 62902064} +{"current_steps": 108510, "total_steps": 119360, "loss": 0.2736, "lr": 2.4964855920004306e-07, "epoch": 18.18197050938338, "percentage": 90.91, "elapsed_time": "4:17:21", "remaining_time": "0:25:43", "throughput": 4073.8, "total_tokens": 62905168} +{"current_steps": 108515, "total_steps": 119360, "loss": 0.619, "lr": 2.494204742998696e-07, "epoch": 18.182808310991955, "percentage": 90.91, "elapsed_time": "4:17:22", "remaining_time": "0:25:43", "throughput": 4073.81, "total_tokens": 62907920} +{"current_steps": 108520, "total_steps": 119360, "loss": 0.332, "lr": 2.491924909739657e-07, "epoch": 18.183646112600535, "percentage": 90.92, "elapsed_time": "4:17:22", "remaining_time": "0:25:42", "throughput": 4073.83, "total_tokens": 62911088} +{"current_steps": 108525, "total_steps": 119360, "loss": 0.5801, "lr": 2.4896460922720575e-07, "epoch": 18.184483914209114, "percentage": 90.92, "elapsed_time": "4:17:23", "remaining_time": "0:25:41", "throughput": 4073.84, "total_tokens": 62914160} +{"current_steps": 108530, "total_steps": 119360, "loss": 0.2793, "lr": 2.4873682906446204e-07, "epoch": 18.185321715817693, "percentage": 90.93, "elapsed_time": "4:17:24", "remaining_time": "0:25:41", "throughput": 4073.85, "total_tokens": 62916912} +{"current_steps": 108535, "total_steps": 119360, "loss": 0.3444, "lr": 2.4850915049060565e-07, "epoch": 18.186159517426272, "percentage": 90.93, "elapsed_time": "4:17:24", "remaining_time": "0:25:40", "throughput": 4073.86, "total_tokens": 62919760} +{"current_steps": 108540, "total_steps": 119360, "loss": 0.3781, "lr": 2.482815735105026e-07, "epoch": 18.18699731903485, "percentage": 90.93, "elapsed_time": "4:17:25", "remaining_time": "0:25:39", "throughput": 4073.86, "total_tokens": 62922704} +{"current_steps": 108545, "total_steps": 119360, "loss": 0.4592, "lr": 2.480540981290208e-07, "epoch": 18.18783512064343, "percentage": 90.94, "elapsed_time": "4:17:26", "remaining_time": "0:25:38", "throughput": 4073.87, "total_tokens": 62925648} +{"current_steps": 108550, "total_steps": 119360, "loss": 0.3635, "lr": 2.4782672435102463e-07, "epoch": 18.18867292225201, "percentage": 90.94, "elapsed_time": "4:17:26", "remaining_time": "0:25:38", "throughput": 4073.88, "total_tokens": 62928592} +{"current_steps": 108555, "total_steps": 119360, "loss": 0.2286, "lr": 2.475994521813735e-07, "epoch": 18.18951072386059, "percentage": 90.95, "elapsed_time": "4:17:27", "remaining_time": "0:25:37", "throughput": 4073.88, "total_tokens": 62931248} +{"current_steps": 108560, "total_steps": 119360, "loss": 0.1284, "lr": 2.4737228162492687e-07, "epoch": 18.19034852546917, "percentage": 90.95, "elapsed_time": "4:17:28", "remaining_time": "0:25:36", "throughput": 4073.89, "total_tokens": 62934000} +{"current_steps": 108565, "total_steps": 119360, "loss": 0.514, "lr": 2.471452126865442e-07, "epoch": 18.191186327077748, "percentage": 90.96, "elapsed_time": "4:17:28", "remaining_time": "0:25:36", "throughput": 4073.9, "total_tokens": 62936816} +{"current_steps": 108570, "total_steps": 119360, "loss": 0.4015, "lr": 2.4691824537107833e-07, "epoch": 18.192024128686327, "percentage": 90.96, "elapsed_time": "4:17:29", "remaining_time": "0:25:35", "throughput": 4073.91, "total_tokens": 62940016} +{"current_steps": 108575, "total_steps": 119360, "loss": 0.3461, "lr": 2.4669137968338366e-07, "epoch": 18.192861930294907, "percentage": 90.96, "elapsed_time": "4:17:30", "remaining_time": "0:25:34", "throughput": 4073.92, "total_tokens": 62942864} +{"current_steps": 108580, "total_steps": 119360, "loss": 0.3924, "lr": 2.4646461562831015e-07, "epoch": 18.193699731903486, "percentage": 90.97, "elapsed_time": "4:17:30", "remaining_time": "0:25:33", "throughput": 4073.92, "total_tokens": 62945392} +{"current_steps": 108585, "total_steps": 119360, "loss": 0.3254, "lr": 2.462379532107062e-07, "epoch": 18.194537533512065, "percentage": 90.97, "elapsed_time": "4:17:31", "remaining_time": "0:25:33", "throughput": 4073.94, "total_tokens": 62948816} +{"current_steps": 108590, "total_steps": 119360, "loss": 0.4145, "lr": 2.460113924354185e-07, "epoch": 18.195375335120644, "percentage": 90.98, "elapsed_time": "4:17:32", "remaining_time": "0:25:32", "throughput": 4073.95, "total_tokens": 62951856} +{"current_steps": 108595, "total_steps": 119360, "loss": 0.1937, "lr": 2.4578493330729203e-07, "epoch": 18.196213136729224, "percentage": 90.98, "elapsed_time": "4:17:32", "remaining_time": "0:25:31", "throughput": 4073.97, "total_tokens": 62954832} +{"current_steps": 108600, "total_steps": 119360, "loss": 0.2603, "lr": 2.455585758311674e-07, "epoch": 18.197050938337803, "percentage": 90.99, "elapsed_time": "4:17:33", "remaining_time": "0:25:31", "throughput": 4073.97, "total_tokens": 62957648} +{"current_steps": 108605, "total_steps": 119360, "loss": 0.481, "lr": 2.45332320011884e-07, "epoch": 18.197888739946382, "percentage": 90.99, "elapsed_time": "4:17:34", "remaining_time": "0:25:30", "throughput": 4073.99, "total_tokens": 62960912} +{"current_steps": 108610, "total_steps": 119360, "loss": 0.2331, "lr": 2.451061658542825e-07, "epoch": 18.19872654155496, "percentage": 90.99, "elapsed_time": "4:17:35", "remaining_time": "0:25:29", "throughput": 4074.01, "total_tokens": 62964048} +{"current_steps": 108615, "total_steps": 119360, "loss": 0.3449, "lr": 2.4488011336319507e-07, "epoch": 18.199564343163537, "percentage": 91.0, "elapsed_time": "4:17:35", "remaining_time": "0:25:28", "throughput": 4074.02, "total_tokens": 62967056} +{"current_steps": 108620, "total_steps": 119360, "loss": 0.364, "lr": 2.4465416254345673e-07, "epoch": 18.200402144772116, "percentage": 91.0, "elapsed_time": "4:17:36", "remaining_time": "0:25:28", "throughput": 4074.03, "total_tokens": 62970000} +{"current_steps": 108625, "total_steps": 119360, "loss": 0.3823, "lr": 2.444283133998987e-07, "epoch": 18.201239946380696, "percentage": 91.01, "elapsed_time": "4:17:37", "remaining_time": "0:25:27", "throughput": 4074.04, "total_tokens": 62972912} +{"current_steps": 108630, "total_steps": 119360, "loss": 0.3478, "lr": 2.442025659373493e-07, "epoch": 18.202077747989275, "percentage": 91.01, "elapsed_time": "4:17:37", "remaining_time": "0:25:26", "throughput": 4074.05, "total_tokens": 62975696} +{"current_steps": 108635, "total_steps": 119360, "loss": 0.3206, "lr": 2.4397692016063566e-07, "epoch": 18.202915549597854, "percentage": 91.01, "elapsed_time": "4:17:38", "remaining_time": "0:25:26", "throughput": 4074.05, "total_tokens": 62978512} +{"current_steps": 108640, "total_steps": 119360, "loss": 0.3661, "lr": 2.43751376074583e-07, "epoch": 18.203753351206434, "percentage": 91.02, "elapsed_time": "4:17:39", "remaining_time": "0:25:25", "throughput": 4074.07, "total_tokens": 62981712} +{"current_steps": 108645, "total_steps": 119360, "loss": 0.1379, "lr": 2.435259336840118e-07, "epoch": 18.204591152815013, "percentage": 91.02, "elapsed_time": "4:17:39", "remaining_time": "0:25:24", "throughput": 4074.08, "total_tokens": 62984528} +{"current_steps": 108650, "total_steps": 119360, "loss": 0.2754, "lr": 2.4330059299374487e-07, "epoch": 18.205428954423592, "percentage": 91.03, "elapsed_time": "4:17:40", "remaining_time": "0:25:23", "throughput": 4074.09, "total_tokens": 62987472} +{"current_steps": 108655, "total_steps": 119360, "loss": 0.3308, "lr": 2.4307535400859893e-07, "epoch": 18.20626675603217, "percentage": 91.03, "elapsed_time": "4:17:41", "remaining_time": "0:25:23", "throughput": 4074.1, "total_tokens": 62990416} +{"current_steps": 108660, "total_steps": 119360, "loss": 0.423, "lr": 2.4285021673339016e-07, "epoch": 18.20710455764075, "percentage": 91.04, "elapsed_time": "4:17:41", "remaining_time": "0:25:22", "throughput": 4074.1, "total_tokens": 62993136} +{"current_steps": 108665, "total_steps": 119360, "loss": 0.3598, "lr": 2.4262518117293187e-07, "epoch": 18.20794235924933, "percentage": 91.04, "elapsed_time": "4:17:42", "remaining_time": "0:25:21", "throughput": 4074.11, "total_tokens": 62996208} +{"current_steps": 108670, "total_steps": 119360, "loss": 0.2647, "lr": 2.424002473320369e-07, "epoch": 18.20878016085791, "percentage": 91.04, "elapsed_time": "4:17:43", "remaining_time": "0:25:21", "throughput": 4074.12, "total_tokens": 62999120} +{"current_steps": 108675, "total_steps": 119360, "loss": 0.5453, "lr": 2.4217541521551314e-07, "epoch": 18.20961796246649, "percentage": 91.05, "elapsed_time": "4:17:43", "remaining_time": "0:25:20", "throughput": 4074.13, "total_tokens": 63002224} +{"current_steps": 108680, "total_steps": 119360, "loss": 0.4599, "lr": 2.4195068482816885e-07, "epoch": 18.210455764075068, "percentage": 91.05, "elapsed_time": "4:17:44", "remaining_time": "0:25:19", "throughput": 4074.14, "total_tokens": 63005232} +{"current_steps": 108685, "total_steps": 119360, "loss": 0.2265, "lr": 2.417260561748086e-07, "epoch": 18.211293565683647, "percentage": 91.06, "elapsed_time": "4:17:45", "remaining_time": "0:25:18", "throughput": 4074.15, "total_tokens": 63008080} +{"current_steps": 108690, "total_steps": 119360, "loss": 0.3724, "lr": 2.4150152926023576e-07, "epoch": 18.212131367292226, "percentage": 91.06, "elapsed_time": "4:17:46", "remaining_time": "0:25:18", "throughput": 4074.17, "total_tokens": 63011216} +{"current_steps": 108695, "total_steps": 119360, "loss": 0.435, "lr": 2.412771040892503e-07, "epoch": 18.212969168900806, "percentage": 91.06, "elapsed_time": "4:17:46", "remaining_time": "0:25:17", "throughput": 4074.18, "total_tokens": 63014064} +{"current_steps": 108700, "total_steps": 119360, "loss": 0.3545, "lr": 2.410527806666518e-07, "epoch": 18.213806970509385, "percentage": 91.07, "elapsed_time": "4:17:47", "remaining_time": "0:25:16", "throughput": 4074.19, "total_tokens": 63016784} +{"current_steps": 108705, "total_steps": 119360, "loss": 0.3833, "lr": 2.408285589972353e-07, "epoch": 18.214644772117964, "percentage": 91.07, "elapsed_time": "4:17:48", "remaining_time": "0:25:16", "throughput": 4074.19, "total_tokens": 63019632} +{"current_steps": 108710, "total_steps": 119360, "loss": 0.3228, "lr": 2.406044390857959e-07, "epoch": 18.21548257372654, "percentage": 91.08, "elapsed_time": "4:17:48", "remaining_time": "0:25:15", "throughput": 4074.2, "total_tokens": 63022256} +{"current_steps": 108715, "total_steps": 119360, "loss": 0.3343, "lr": 2.403804209371263e-07, "epoch": 18.21632037533512, "percentage": 91.08, "elapsed_time": "4:17:49", "remaining_time": "0:25:14", "throughput": 4074.2, "total_tokens": 63024912} +{"current_steps": 108720, "total_steps": 119360, "loss": 0.4995, "lr": 2.401565045560145e-07, "epoch": 18.2171581769437, "percentage": 91.09, "elapsed_time": "4:17:49", "remaining_time": "0:25:13", "throughput": 4074.21, "total_tokens": 63027920} +{"current_steps": 108725, "total_steps": 119360, "loss": 0.4266, "lr": 2.399326899472487e-07, "epoch": 18.217995978552278, "percentage": 91.09, "elapsed_time": "4:17:50", "remaining_time": "0:25:13", "throughput": 4074.21, "total_tokens": 63030704} +{"current_steps": 108730, "total_steps": 119360, "loss": 0.2882, "lr": 2.3970897711561583e-07, "epoch": 18.218833780160857, "percentage": 91.09, "elapsed_time": "4:17:51", "remaining_time": "0:25:12", "throughput": 4074.22, "total_tokens": 63033552} +{"current_steps": 108735, "total_steps": 119360, "loss": 0.3458, "lr": 2.394853660658975e-07, "epoch": 18.219671581769436, "percentage": 91.1, "elapsed_time": "4:17:51", "remaining_time": "0:25:11", "throughput": 4074.23, "total_tokens": 63036400} +{"current_steps": 108740, "total_steps": 119360, "loss": 0.509, "lr": 2.3926185680287595e-07, "epoch": 18.220509383378015, "percentage": 91.1, "elapsed_time": "4:17:52", "remaining_time": "0:25:11", "throughput": 4074.25, "total_tokens": 63039664} +{"current_steps": 108745, "total_steps": 119360, "loss": 0.5979, "lr": 2.3903844933132915e-07, "epoch": 18.221347184986595, "percentage": 91.11, "elapsed_time": "4:17:53", "remaining_time": "0:25:10", "throughput": 4074.26, "total_tokens": 63042480} +{"current_steps": 108750, "total_steps": 119360, "loss": 0.3328, "lr": 2.388151436560343e-07, "epoch": 18.222184986595174, "percentage": 91.11, "elapsed_time": "4:17:54", "remaining_time": "0:25:09", "throughput": 4074.27, "total_tokens": 63045648} +{"current_steps": 108755, "total_steps": 119360, "loss": 0.3965, "lr": 2.3859193978176653e-07, "epoch": 18.223022788203753, "percentage": 91.12, "elapsed_time": "4:17:54", "remaining_time": "0:25:08", "throughput": 4074.28, "total_tokens": 63048400} +{"current_steps": 108760, "total_steps": 119360, "loss": 0.5395, "lr": 2.3836883771329812e-07, "epoch": 18.223860589812332, "percentage": 91.12, "elapsed_time": "4:17:55", "remaining_time": "0:25:08", "throughput": 4074.28, "total_tokens": 63051216} +{"current_steps": 108765, "total_steps": 119360, "loss": 0.4133, "lr": 2.3814583745539798e-07, "epoch": 18.22469839142091, "percentage": 91.12, "elapsed_time": "4:17:56", "remaining_time": "0:25:07", "throughput": 4074.29, "total_tokens": 63053872} +{"current_steps": 108770, "total_steps": 119360, "loss": 0.4482, "lr": 2.379229390128357e-07, "epoch": 18.22553619302949, "percentage": 91.13, "elapsed_time": "4:17:56", "remaining_time": "0:25:06", "throughput": 4074.29, "total_tokens": 63056592} +{"current_steps": 108775, "total_steps": 119360, "loss": 0.0867, "lr": 2.3770014239037742e-07, "epoch": 18.22637399463807, "percentage": 91.13, "elapsed_time": "4:17:57", "remaining_time": "0:25:06", "throughput": 4074.31, "total_tokens": 63059632} +{"current_steps": 108780, "total_steps": 119360, "loss": 0.3363, "lr": 2.374774475927849e-07, "epoch": 18.22721179624665, "percentage": 91.14, "elapsed_time": "4:17:58", "remaining_time": "0:25:05", "throughput": 4074.31, "total_tokens": 63062416} +{"current_steps": 108785, "total_steps": 119360, "loss": 0.3702, "lr": 2.3725485462482157e-07, "epoch": 18.22804959785523, "percentage": 91.14, "elapsed_time": "4:17:58", "remaining_time": "0:25:04", "throughput": 4074.31, "total_tokens": 63065040} +{"current_steps": 108790, "total_steps": 119360, "loss": 0.4163, "lr": 2.370323634912458e-07, "epoch": 18.228887399463808, "percentage": 91.14, "elapsed_time": "4:17:59", "remaining_time": "0:25:03", "throughput": 4074.32, "total_tokens": 63067792} +{"current_steps": 108795, "total_steps": 119360, "loss": 0.5681, "lr": 2.3680997419681552e-07, "epoch": 18.229725201072387, "percentage": 91.15, "elapsed_time": "4:17:59", "remaining_time": "0:25:03", "throughput": 4074.33, "total_tokens": 63070576} +{"current_steps": 108800, "total_steps": 119360, "loss": 0.1667, "lr": 2.3658768674628462e-07, "epoch": 18.230563002680967, "percentage": 91.15, "elapsed_time": "4:18:00", "remaining_time": "0:25:02", "throughput": 4074.33, "total_tokens": 63073296} +{"current_steps": 108805, "total_steps": 119360, "loss": 0.1931, "lr": 2.363655011444077e-07, "epoch": 18.231400804289546, "percentage": 91.16, "elapsed_time": "4:18:01", "remaining_time": "0:25:01", "throughput": 4074.35, "total_tokens": 63076368} +{"current_steps": 108810, "total_steps": 119360, "loss": 0.428, "lr": 2.361434173959326e-07, "epoch": 18.23223860589812, "percentage": 91.16, "elapsed_time": "4:18:01", "remaining_time": "0:25:01", "throughput": 4074.36, "total_tokens": 63079152} +{"current_steps": 108815, "total_steps": 119360, "loss": 0.1909, "lr": 2.3592143550561054e-07, "epoch": 18.2330764075067, "percentage": 91.17, "elapsed_time": "4:18:02", "remaining_time": "0:25:00", "throughput": 4074.37, "total_tokens": 63082160} +{"current_steps": 108820, "total_steps": 119360, "loss": 0.4205, "lr": 2.3569955547818769e-07, "epoch": 18.23391420911528, "percentage": 91.17, "elapsed_time": "4:18:03", "remaining_time": "0:24:59", "throughput": 4074.38, "total_tokens": 63084976} +{"current_steps": 108825, "total_steps": 119360, "loss": 0.4035, "lr": 2.3547777731840582e-07, "epoch": 18.23475201072386, "percentage": 91.17, "elapsed_time": "4:18:03", "remaining_time": "0:24:58", "throughput": 4074.39, "total_tokens": 63087856} +{"current_steps": 108830, "total_steps": 119360, "loss": 0.2816, "lr": 2.3525610103100894e-07, "epoch": 18.23558981233244, "percentage": 91.18, "elapsed_time": "4:18:04", "remaining_time": "0:24:58", "throughput": 4074.4, "total_tokens": 63090736} +{"current_steps": 108835, "total_steps": 119360, "loss": 0.2932, "lr": 2.35034526620736e-07, "epoch": 18.236427613941018, "percentage": 91.18, "elapsed_time": "4:18:05", "remaining_time": "0:24:57", "throughput": 4074.41, "total_tokens": 63093328} +{"current_steps": 108840, "total_steps": 119360, "loss": 0.3619, "lr": 2.348130540923249e-07, "epoch": 18.237265415549597, "percentage": 91.19, "elapsed_time": "4:18:05", "remaining_time": "0:24:56", "throughput": 4074.41, "total_tokens": 63096048} +{"current_steps": 108845, "total_steps": 119360, "loss": 0.5099, "lr": 2.3459168345051075e-07, "epoch": 18.238103217158177, "percentage": 91.19, "elapsed_time": "4:18:06", "remaining_time": "0:24:56", "throughput": 4074.43, "total_tokens": 63099056} +{"current_steps": 108850, "total_steps": 119360, "loss": 0.2303, "lr": 2.3437041470002698e-07, "epoch": 18.238941018766756, "percentage": 91.19, "elapsed_time": "4:18:07", "remaining_time": "0:24:55", "throughput": 4074.44, "total_tokens": 63101936} +{"current_steps": 108855, "total_steps": 119360, "loss": 0.4057, "lr": 2.3414924784560422e-07, "epoch": 18.239778820375335, "percentage": 91.2, "elapsed_time": "4:18:07", "remaining_time": "0:24:54", "throughput": 4074.45, "total_tokens": 63104624} +{"current_steps": 108860, "total_steps": 119360, "loss": 0.1539, "lr": 2.3392818289197204e-07, "epoch": 18.240616621983914, "percentage": 91.2, "elapsed_time": "4:18:08", "remaining_time": "0:24:53", "throughput": 4074.46, "total_tokens": 63107504} +{"current_steps": 108865, "total_steps": 119360, "loss": 0.1934, "lr": 2.3370721984385725e-07, "epoch": 18.241454423592494, "percentage": 91.21, "elapsed_time": "4:18:09", "remaining_time": "0:24:53", "throughput": 4074.47, "total_tokens": 63110480} +{"current_steps": 108870, "total_steps": 119360, "loss": 0.4293, "lr": 2.334863587059827e-07, "epoch": 18.242292225201073, "percentage": 91.21, "elapsed_time": "4:18:09", "remaining_time": "0:24:52", "throughput": 4074.47, "total_tokens": 63113392} +{"current_steps": 108875, "total_steps": 119360, "loss": 0.4569, "lr": 2.3326559948307292e-07, "epoch": 18.243130026809652, "percentage": 91.22, "elapsed_time": "4:18:10", "remaining_time": "0:24:51", "throughput": 4074.48, "total_tokens": 63116144} +{"current_steps": 108880, "total_steps": 119360, "loss": 0.2776, "lr": 2.3304494217984752e-07, "epoch": 18.24396782841823, "percentage": 91.22, "elapsed_time": "4:18:11", "remaining_time": "0:24:51", "throughput": 4074.49, "total_tokens": 63119408} +{"current_steps": 108885, "total_steps": 119360, "loss": 0.3628, "lr": 2.3282438680102327e-07, "epoch": 18.24480563002681, "percentage": 91.22, "elapsed_time": "4:18:12", "remaining_time": "0:24:50", "throughput": 4074.5, "total_tokens": 63122608} +{"current_steps": 108890, "total_steps": 119360, "loss": 0.5898, "lr": 2.3260393335131637e-07, "epoch": 18.24564343163539, "percentage": 91.23, "elapsed_time": "4:18:12", "remaining_time": "0:24:49", "throughput": 4074.51, "total_tokens": 63125424} +{"current_steps": 108895, "total_steps": 119360, "loss": 0.4006, "lr": 2.323835818354414e-07, "epoch": 18.24648123324397, "percentage": 91.23, "elapsed_time": "4:18:13", "remaining_time": "0:24:48", "throughput": 4074.52, "total_tokens": 63128400} +{"current_steps": 108900, "total_steps": 119360, "loss": 0.2341, "lr": 2.321633322581085e-07, "epoch": 18.24731903485255, "percentage": 91.24, "elapsed_time": "4:18:14", "remaining_time": "0:24:48", "throughput": 4074.54, "total_tokens": 63131312} +{"current_steps": 108905, "total_steps": 119360, "loss": 0.2505, "lr": 2.3194318462402776e-07, "epoch": 18.248156836461128, "percentage": 91.24, "elapsed_time": "4:18:14", "remaining_time": "0:24:47", "throughput": 4074.55, "total_tokens": 63134352} +{"current_steps": 108910, "total_steps": 119360, "loss": 0.2489, "lr": 2.3172313893790655e-07, "epoch": 18.248994638069703, "percentage": 91.24, "elapsed_time": "4:18:15", "remaining_time": "0:24:46", "throughput": 4074.57, "total_tokens": 63137552} +{"current_steps": 108915, "total_steps": 119360, "loss": 0.2185, "lr": 2.3150319520444887e-07, "epoch": 18.249832439678283, "percentage": 91.25, "elapsed_time": "4:18:16", "remaining_time": "0:24:46", "throughput": 4074.57, "total_tokens": 63140368} +{"current_steps": 108920, "total_steps": 119360, "loss": 0.3605, "lr": 2.3128335342835817e-07, "epoch": 18.250670241286862, "percentage": 91.25, "elapsed_time": "4:18:16", "remaining_time": "0:24:45", "throughput": 4074.58, "total_tokens": 63143120} +{"current_steps": 108925, "total_steps": 119360, "loss": 0.3051, "lr": 2.3106361361433517e-07, "epoch": 18.25150804289544, "percentage": 91.26, "elapsed_time": "4:18:17", "remaining_time": "0:24:44", "throughput": 4074.59, "total_tokens": 63146224} +{"current_steps": 108930, "total_steps": 119360, "loss": 0.2507, "lr": 2.3084397576707607e-07, "epoch": 18.25234584450402, "percentage": 91.26, "elapsed_time": "4:18:18", "remaining_time": "0:24:43", "throughput": 4074.59, "total_tokens": 63148944} +{"current_steps": 108935, "total_steps": 119360, "loss": 0.2563, "lr": 2.3062443989128048e-07, "epoch": 18.2531836461126, "percentage": 91.27, "elapsed_time": "4:18:18", "remaining_time": "0:24:43", "throughput": 4074.6, "total_tokens": 63151728} +{"current_steps": 108940, "total_steps": 119360, "loss": 0.403, "lr": 2.3040500599164018e-07, "epoch": 18.25402144772118, "percentage": 91.27, "elapsed_time": "4:18:19", "remaining_time": "0:24:42", "throughput": 4074.61, "total_tokens": 63154896} +{"current_steps": 108945, "total_steps": 119360, "loss": 0.2639, "lr": 2.3018567407284698e-07, "epoch": 18.25485924932976, "percentage": 91.27, "elapsed_time": "4:18:20", "remaining_time": "0:24:41", "throughput": 4074.63, "total_tokens": 63157936} +{"current_steps": 108950, "total_steps": 119360, "loss": 0.3441, "lr": 2.29966444139591e-07, "epoch": 18.255697050938338, "percentage": 91.28, "elapsed_time": "4:18:20", "remaining_time": "0:24:41", "throughput": 4074.63, "total_tokens": 63160688} +{"current_steps": 108955, "total_steps": 119360, "loss": 0.3831, "lr": 2.2974731619655967e-07, "epoch": 18.256534852546917, "percentage": 91.28, "elapsed_time": "4:18:21", "remaining_time": "0:24:40", "throughput": 4074.65, "total_tokens": 63163568} +{"current_steps": 108960, "total_steps": 119360, "loss": 0.4929, "lr": 2.2952829024843858e-07, "epoch": 18.257372654155496, "percentage": 91.29, "elapsed_time": "4:18:22", "remaining_time": "0:24:39", "throughput": 4074.65, "total_tokens": 63166288} +{"current_steps": 108965, "total_steps": 119360, "loss": 0.2111, "lr": 2.2930936629991018e-07, "epoch": 18.258210455764075, "percentage": 91.29, "elapsed_time": "4:18:22", "remaining_time": "0:24:38", "throughput": 4074.66, "total_tokens": 63169104} +{"current_steps": 108970, "total_steps": 119360, "loss": 0.244, "lr": 2.2909054435565625e-07, "epoch": 18.259048257372655, "percentage": 91.3, "elapsed_time": "4:18:23", "remaining_time": "0:24:38", "throughput": 4074.67, "total_tokens": 63171920} +{"current_steps": 108975, "total_steps": 119360, "loss": 0.526, "lr": 2.2887182442035417e-07, "epoch": 18.259886058981234, "percentage": 91.3, "elapsed_time": "4:18:24", "remaining_time": "0:24:37", "throughput": 4074.68, "total_tokens": 63174736} +{"current_steps": 108980, "total_steps": 119360, "loss": 0.1891, "lr": 2.2865320649868129e-07, "epoch": 18.260723860589813, "percentage": 91.3, "elapsed_time": "4:18:24", "remaining_time": "0:24:36", "throughput": 4074.7, "total_tokens": 63177872} +{"current_steps": 108985, "total_steps": 119360, "loss": 0.552, "lr": 2.2843469059531332e-07, "epoch": 18.261561662198392, "percentage": 91.31, "elapsed_time": "4:18:25", "remaining_time": "0:24:36", "throughput": 4074.71, "total_tokens": 63180944} +{"current_steps": 108990, "total_steps": 119360, "loss": 0.2514, "lr": 2.2821627671491985e-07, "epoch": 18.26239946380697, "percentage": 91.31, "elapsed_time": "4:18:26", "remaining_time": "0:24:35", "throughput": 4074.72, "total_tokens": 63183856} +{"current_steps": 108995, "total_steps": 119360, "loss": 0.3603, "lr": 2.2799796486217218e-07, "epoch": 18.26323726541555, "percentage": 91.32, "elapsed_time": "4:18:26", "remaining_time": "0:24:34", "throughput": 4074.73, "total_tokens": 63186640} +{"current_steps": 109000, "total_steps": 119360, "loss": 0.2797, "lr": 2.2777975504173821e-07, "epoch": 18.26407506702413, "percentage": 91.32, "elapsed_time": "4:18:27", "remaining_time": "0:24:33", "throughput": 4074.74, "total_tokens": 63189680} +{"current_steps": 109005, "total_steps": 119360, "loss": 0.253, "lr": 2.2756164725828367e-07, "epoch": 18.264912868632706, "percentage": 91.32, "elapsed_time": "4:18:28", "remaining_time": "0:24:33", "throughput": 4074.75, "total_tokens": 63192496} +{"current_steps": 109010, "total_steps": 119360, "loss": 0.467, "lr": 2.2734364151647148e-07, "epoch": 18.265750670241285, "percentage": 91.33, "elapsed_time": "4:18:29", "remaining_time": "0:24:32", "throughput": 4074.76, "total_tokens": 63195440} +{"current_steps": 109015, "total_steps": 119360, "loss": 0.4109, "lr": 2.271257378209635e-07, "epoch": 18.266588471849865, "percentage": 91.33, "elapsed_time": "4:18:29", "remaining_time": "0:24:31", "throughput": 4074.77, "total_tokens": 63198608} +{"current_steps": 109020, "total_steps": 119360, "loss": 0.3549, "lr": 2.2690793617641871e-07, "epoch": 18.267426273458444, "percentage": 91.34, "elapsed_time": "4:18:30", "remaining_time": "0:24:31", "throughput": 4074.78, "total_tokens": 63201296} +{"current_steps": 109025, "total_steps": 119360, "loss": 0.2689, "lr": 2.2669023658749346e-07, "epoch": 18.268264075067023, "percentage": 91.34, "elapsed_time": "4:18:31", "remaining_time": "0:24:30", "throughput": 4074.79, "total_tokens": 63204208} +{"current_steps": 109030, "total_steps": 119360, "loss": 0.5349, "lr": 2.2647263905884397e-07, "epoch": 18.269101876675602, "percentage": 91.35, "elapsed_time": "4:18:31", "remaining_time": "0:24:29", "throughput": 4074.79, "total_tokens": 63207056} +{"current_steps": 109035, "total_steps": 119360, "loss": 0.4685, "lr": 2.262551435951199e-07, "epoch": 18.26993967828418, "percentage": 91.35, "elapsed_time": "4:18:32", "remaining_time": "0:24:28", "throughput": 4074.8, "total_tokens": 63209936} +{"current_steps": 109040, "total_steps": 119360, "loss": 0.325, "lr": 2.260377502009753e-07, "epoch": 18.27077747989276, "percentage": 91.35, "elapsed_time": "4:18:33", "remaining_time": "0:24:28", "throughput": 4074.82, "total_tokens": 63212880} +{"current_steps": 109045, "total_steps": 119360, "loss": 0.617, "lr": 2.2582045888105587e-07, "epoch": 18.27161528150134, "percentage": 91.36, "elapsed_time": "4:18:33", "remaining_time": "0:24:27", "throughput": 4074.83, "total_tokens": 63215792} +{"current_steps": 109050, "total_steps": 119360, "loss": 0.2356, "lr": 2.2560326964000789e-07, "epoch": 18.27245308310992, "percentage": 91.36, "elapsed_time": "4:18:34", "remaining_time": "0:24:26", "throughput": 4074.83, "total_tokens": 63218512} +{"current_steps": 109055, "total_steps": 119360, "loss": 0.3783, "lr": 2.2538618248247545e-07, "epoch": 18.2732908847185, "percentage": 91.37, "elapsed_time": "4:18:35", "remaining_time": "0:24:26", "throughput": 4074.84, "total_tokens": 63221424} +{"current_steps": 109060, "total_steps": 119360, "loss": 0.3344, "lr": 2.251691974131004e-07, "epoch": 18.274128686327078, "percentage": 91.37, "elapsed_time": "4:18:35", "remaining_time": "0:24:25", "throughput": 4074.84, "total_tokens": 63224112} +{"current_steps": 109065, "total_steps": 119360, "loss": 0.337, "lr": 2.2495231443652234e-07, "epoch": 18.274966487935657, "percentage": 91.37, "elapsed_time": "4:18:36", "remaining_time": "0:24:24", "throughput": 4074.86, "total_tokens": 63227152} +{"current_steps": 109070, "total_steps": 119360, "loss": 0.0584, "lr": 2.247355335573781e-07, "epoch": 18.275804289544237, "percentage": 91.38, "elapsed_time": "4:18:37", "remaining_time": "0:24:23", "throughput": 4074.86, "total_tokens": 63230000} +{"current_steps": 109075, "total_steps": 119360, "loss": 0.2889, "lr": 2.245188547803029e-07, "epoch": 18.276642091152816, "percentage": 91.38, "elapsed_time": "4:18:37", "remaining_time": "0:24:23", "throughput": 4074.87, "total_tokens": 63232688} +{"current_steps": 109080, "total_steps": 119360, "loss": 0.2665, "lr": 2.2430227810992965e-07, "epoch": 18.277479892761395, "percentage": 91.39, "elapsed_time": "4:18:38", "remaining_time": "0:24:22", "throughput": 4074.88, "total_tokens": 63235472} +{"current_steps": 109085, "total_steps": 119360, "loss": 0.3262, "lr": 2.240858035508897e-07, "epoch": 18.278317694369974, "percentage": 91.39, "elapsed_time": "4:18:39", "remaining_time": "0:24:21", "throughput": 4074.89, "total_tokens": 63238448} +{"current_steps": 109090, "total_steps": 119360, "loss": 0.2437, "lr": 2.2386943110781047e-07, "epoch": 18.279155495978554, "percentage": 91.4, "elapsed_time": "4:18:39", "remaining_time": "0:24:21", "throughput": 4074.91, "total_tokens": 63241680} +{"current_steps": 109095, "total_steps": 119360, "loss": 0.4295, "lr": 2.2365316078531818e-07, "epoch": 18.279993297587133, "percentage": 91.4, "elapsed_time": "4:18:40", "remaining_time": "0:24:20", "throughput": 4074.93, "total_tokens": 63244880} +{"current_steps": 109100, "total_steps": 119360, "loss": 0.2346, "lr": 2.234369925880392e-07, "epoch": 18.280831099195712, "percentage": 91.4, "elapsed_time": "4:18:41", "remaining_time": "0:24:19", "throughput": 4074.93, "total_tokens": 63247664} +{"current_steps": 109105, "total_steps": 119360, "loss": 0.5401, "lr": 2.2322092652059313e-07, "epoch": 18.281668900804288, "percentage": 91.41, "elapsed_time": "4:18:41", "remaining_time": "0:24:18", "throughput": 4074.94, "total_tokens": 63250640} +{"current_steps": 109110, "total_steps": 119360, "loss": 0.3409, "lr": 2.2300496258760073e-07, "epoch": 18.282506702412867, "percentage": 91.41, "elapsed_time": "4:18:42", "remaining_time": "0:24:18", "throughput": 4074.95, "total_tokens": 63253456} +{"current_steps": 109115, "total_steps": 119360, "loss": 0.1507, "lr": 2.2278910079367944e-07, "epoch": 18.283344504021446, "percentage": 91.42, "elapsed_time": "4:18:43", "remaining_time": "0:24:17", "throughput": 4074.96, "total_tokens": 63256304} +{"current_steps": 109120, "total_steps": 119360, "loss": 0.3099, "lr": 2.2257334114344443e-07, "epoch": 18.284182305630026, "percentage": 91.42, "elapsed_time": "4:18:43", "remaining_time": "0:24:16", "throughput": 4074.97, "total_tokens": 63259088} +{"current_steps": 109125, "total_steps": 119360, "loss": 0.3749, "lr": 2.2235768364150977e-07, "epoch": 18.285020107238605, "percentage": 91.43, "elapsed_time": "4:18:44", "remaining_time": "0:24:16", "throughput": 4074.98, "total_tokens": 63261968} +{"current_steps": 109130, "total_steps": 119360, "loss": 0.3801, "lr": 2.221421282924857e-07, "epoch": 18.285857908847184, "percentage": 91.43, "elapsed_time": "4:18:45", "remaining_time": "0:24:15", "throughput": 4075.0, "total_tokens": 63265168} +{"current_steps": 109135, "total_steps": 119360, "loss": 0.3094, "lr": 2.2192667510098243e-07, "epoch": 18.286695710455763, "percentage": 91.43, "elapsed_time": "4:18:45", "remaining_time": "0:24:14", "throughput": 4075.0, "total_tokens": 63267952} +{"current_steps": 109140, "total_steps": 119360, "loss": 0.1467, "lr": 2.2171132407160457e-07, "epoch": 18.287533512064343, "percentage": 91.44, "elapsed_time": "4:18:46", "remaining_time": "0:24:13", "throughput": 4075.01, "total_tokens": 63270736} +{"current_steps": 109145, "total_steps": 119360, "loss": 0.3951, "lr": 2.21496075208959e-07, "epoch": 18.288371313672922, "percentage": 91.44, "elapsed_time": "4:18:47", "remaining_time": "0:24:13", "throughput": 4075.03, "total_tokens": 63273840} +{"current_steps": 109150, "total_steps": 119360, "loss": 0.3861, "lr": 2.2128092851764593e-07, "epoch": 18.2892091152815, "percentage": 91.45, "elapsed_time": "4:18:47", "remaining_time": "0:24:12", "throughput": 4075.03, "total_tokens": 63276592} +{"current_steps": 109155, "total_steps": 119360, "loss": 0.4099, "lr": 2.2106588400226614e-07, "epoch": 18.29004691689008, "percentage": 91.45, "elapsed_time": "4:18:48", "remaining_time": "0:24:11", "throughput": 4075.05, "total_tokens": 63280048} +{"current_steps": 109160, "total_steps": 119360, "loss": 0.4645, "lr": 2.2085094166741815e-07, "epoch": 18.29088471849866, "percentage": 91.45, "elapsed_time": "4:18:49", "remaining_time": "0:24:11", "throughput": 4075.06, "total_tokens": 63282896} +{"current_steps": 109165, "total_steps": 119360, "loss": 0.3071, "lr": 2.2063610151769776e-07, "epoch": 18.29172252010724, "percentage": 91.46, "elapsed_time": "4:18:49", "remaining_time": "0:24:10", "throughput": 4075.07, "total_tokens": 63285744} +{"current_steps": 109170, "total_steps": 119360, "loss": 0.444, "lr": 2.2042136355769793e-07, "epoch": 18.29256032171582, "percentage": 91.46, "elapsed_time": "4:18:50", "remaining_time": "0:24:09", "throughput": 4075.08, "total_tokens": 63288560} +{"current_steps": 109175, "total_steps": 119360, "loss": 0.281, "lr": 2.2020672779201058e-07, "epoch": 18.293398123324398, "percentage": 91.47, "elapsed_time": "4:18:51", "remaining_time": "0:24:08", "throughput": 4075.09, "total_tokens": 63291600} +{"current_steps": 109180, "total_steps": 119360, "loss": 0.3593, "lr": 2.1999219422522423e-07, "epoch": 18.294235924932977, "percentage": 91.47, "elapsed_time": "4:18:51", "remaining_time": "0:24:08", "throughput": 4075.09, "total_tokens": 63294160} +{"current_steps": 109185, "total_steps": 119360, "loss": 0.0851, "lr": 2.1977776286192686e-07, "epoch": 18.295073726541556, "percentage": 91.48, "elapsed_time": "4:18:52", "remaining_time": "0:24:07", "throughput": 4075.11, "total_tokens": 63297232} +{"current_steps": 109190, "total_steps": 119360, "loss": 0.4715, "lr": 2.1956343370670376e-07, "epoch": 18.295911528150135, "percentage": 91.48, "elapsed_time": "4:18:53", "remaining_time": "0:24:06", "throughput": 4075.12, "total_tokens": 63300432} +{"current_steps": 109195, "total_steps": 119360, "loss": 0.4136, "lr": 2.1934920676413563e-07, "epoch": 18.296749329758715, "percentage": 91.48, "elapsed_time": "4:18:54", "remaining_time": "0:24:06", "throughput": 4075.13, "total_tokens": 63303280} +{"current_steps": 109200, "total_steps": 119360, "loss": 0.4186, "lr": 2.1913508203880328e-07, "epoch": 18.297587131367294, "percentage": 91.49, "elapsed_time": "4:18:54", "remaining_time": "0:24:05", "throughput": 4075.13, "total_tokens": 63306032} +{"current_steps": 109205, "total_steps": 119360, "loss": 0.4894, "lr": 2.1892105953528753e-07, "epoch": 18.29842493297587, "percentage": 91.49, "elapsed_time": "4:18:55", "remaining_time": "0:24:04", "throughput": 4075.13, "total_tokens": 63308560} +{"current_steps": 109210, "total_steps": 119360, "loss": 0.6191, "lr": 2.187071392581619e-07, "epoch": 18.29926273458445, "percentage": 91.5, "elapsed_time": "4:18:55", "remaining_time": "0:24:03", "throughput": 4075.14, "total_tokens": 63311248} +{"current_steps": 109215, "total_steps": 119360, "loss": 0.3516, "lr": 2.1849332121200107e-07, "epoch": 18.30010053619303, "percentage": 91.5, "elapsed_time": "4:18:56", "remaining_time": "0:24:03", "throughput": 4075.14, "total_tokens": 63314000} +{"current_steps": 109220, "total_steps": 119360, "loss": 0.4711, "lr": 2.1827960540137693e-07, "epoch": 18.300938337801608, "percentage": 91.5, "elapsed_time": "4:18:57", "remaining_time": "0:24:02", "throughput": 4075.16, "total_tokens": 63316976} +{"current_steps": 109225, "total_steps": 119360, "loss": 0.2039, "lr": 2.1806599183085918e-07, "epoch": 18.301776139410187, "percentage": 91.51, "elapsed_time": "4:18:57", "remaining_time": "0:24:01", "throughput": 4075.17, "total_tokens": 63319952} +{"current_steps": 109230, "total_steps": 119360, "loss": 0.4914, "lr": 2.1785248050501473e-07, "epoch": 18.302613941018766, "percentage": 91.51, "elapsed_time": "4:18:58", "remaining_time": "0:24:01", "throughput": 4075.18, "total_tokens": 63322864} +{"current_steps": 109235, "total_steps": 119360, "loss": 0.4294, "lr": 2.1763907142840878e-07, "epoch": 18.303451742627345, "percentage": 91.52, "elapsed_time": "4:18:59", "remaining_time": "0:24:00", "throughput": 4075.18, "total_tokens": 63325648} +{"current_steps": 109240, "total_steps": 119360, "loss": 0.3566, "lr": 2.1742576460560494e-07, "epoch": 18.304289544235925, "percentage": 91.52, "elapsed_time": "4:19:00", "remaining_time": "0:23:59", "throughput": 4075.2, "total_tokens": 63328624} +{"current_steps": 109245, "total_steps": 119360, "loss": 0.2885, "lr": 2.172125600411634e-07, "epoch": 18.305127345844504, "percentage": 91.53, "elapsed_time": "4:19:00", "remaining_time": "0:23:58", "throughput": 4075.21, "total_tokens": 63331504} +{"current_steps": 109250, "total_steps": 119360, "loss": 0.4422, "lr": 2.1699945773964393e-07, "epoch": 18.305965147453083, "percentage": 91.53, "elapsed_time": "4:19:01", "remaining_time": "0:23:58", "throughput": 4075.22, "total_tokens": 63334384} +{"current_steps": 109255, "total_steps": 119360, "loss": 0.1364, "lr": 2.1678645770560114e-07, "epoch": 18.306802949061662, "percentage": 91.53, "elapsed_time": "4:19:02", "remaining_time": "0:23:57", "throughput": 4075.24, "total_tokens": 63337360} +{"current_steps": 109260, "total_steps": 119360, "loss": 0.4228, "lr": 2.165735599435892e-07, "epoch": 18.30764075067024, "percentage": 91.54, "elapsed_time": "4:19:02", "remaining_time": "0:23:56", "throughput": 4075.25, "total_tokens": 63340272} +{"current_steps": 109265, "total_steps": 119360, "loss": 0.5978, "lr": 2.1636076445816333e-07, "epoch": 18.30847855227882, "percentage": 91.54, "elapsed_time": "4:19:03", "remaining_time": "0:23:56", "throughput": 4075.26, "total_tokens": 63343120} +{"current_steps": 109270, "total_steps": 119360, "loss": 0.8505, "lr": 2.1614807125386994e-07, "epoch": 18.3093163538874, "percentage": 91.55, "elapsed_time": "4:19:04", "remaining_time": "0:23:55", "throughput": 4075.26, "total_tokens": 63345936} +{"current_steps": 109275, "total_steps": 119360, "loss": 0.2673, "lr": 2.1593548033525813e-07, "epoch": 18.31015415549598, "percentage": 91.55, "elapsed_time": "4:19:04", "remaining_time": "0:23:54", "throughput": 4075.27, "total_tokens": 63348592} +{"current_steps": 109280, "total_steps": 119360, "loss": 0.4064, "lr": 2.1572299170687316e-07, "epoch": 18.31099195710456, "percentage": 91.55, "elapsed_time": "4:19:05", "remaining_time": "0:23:53", "throughput": 4075.27, "total_tokens": 63351280} +{"current_steps": 109285, "total_steps": 119360, "loss": 0.2683, "lr": 2.1551060537325862e-07, "epoch": 18.311829758713138, "percentage": 91.56, "elapsed_time": "4:19:05", "remaining_time": "0:23:53", "throughput": 4075.28, "total_tokens": 63354032} +{"current_steps": 109290, "total_steps": 119360, "loss": 0.2971, "lr": 2.152983213389559e-07, "epoch": 18.312667560321717, "percentage": 91.56, "elapsed_time": "4:19:06", "remaining_time": "0:23:52", "throughput": 4075.29, "total_tokens": 63356976} +{"current_steps": 109295, "total_steps": 119360, "loss": 0.3338, "lr": 2.1508613960850355e-07, "epoch": 18.313505361930297, "percentage": 91.57, "elapsed_time": "4:19:07", "remaining_time": "0:23:51", "throughput": 4075.3, "total_tokens": 63359760} +{"current_steps": 109300, "total_steps": 119360, "loss": 0.4507, "lr": 2.1487406018643796e-07, "epoch": 18.314343163538872, "percentage": 91.57, "elapsed_time": "4:19:07", "remaining_time": "0:23:51", "throughput": 4075.3, "total_tokens": 63362512} +{"current_steps": 109305, "total_steps": 119360, "loss": 0.175, "lr": 2.146620830772933e-07, "epoch": 18.31518096514745, "percentage": 91.58, "elapsed_time": "4:19:08", "remaining_time": "0:23:50", "throughput": 4075.3, "total_tokens": 63365168} +{"current_steps": 109310, "total_steps": 119360, "loss": 0.3892, "lr": 2.144502082856037e-07, "epoch": 18.31601876675603, "percentage": 91.58, "elapsed_time": "4:19:09", "remaining_time": "0:23:49", "throughput": 4075.31, "total_tokens": 63368112} +{"current_steps": 109315, "total_steps": 119360, "loss": 0.4456, "lr": 2.1423843581589832e-07, "epoch": 18.31685656836461, "percentage": 91.58, "elapsed_time": "4:19:09", "remaining_time": "0:23:48", "throughput": 4075.33, "total_tokens": 63371312} +{"current_steps": 109320, "total_steps": 119360, "loss": 0.142, "lr": 2.1402676567270463e-07, "epoch": 18.31769436997319, "percentage": 91.59, "elapsed_time": "4:19:10", "remaining_time": "0:23:48", "throughput": 4075.35, "total_tokens": 63374480} +{"current_steps": 109325, "total_steps": 119360, "loss": 0.4127, "lr": 2.1381519786054904e-07, "epoch": 18.31853217158177, "percentage": 91.59, "elapsed_time": "4:19:11", "remaining_time": "0:23:47", "throughput": 4075.36, "total_tokens": 63377520} +{"current_steps": 109330, "total_steps": 119360, "loss": 0.4788, "lr": 2.1360373238395516e-07, "epoch": 18.319369973190348, "percentage": 91.6, "elapsed_time": "4:19:12", "remaining_time": "0:23:46", "throughput": 4075.37, "total_tokens": 63380528} +{"current_steps": 109335, "total_steps": 119360, "loss": 0.4126, "lr": 2.133923692474449e-07, "epoch": 18.320207774798927, "percentage": 91.6, "elapsed_time": "4:19:12", "remaining_time": "0:23:46", "throughput": 4075.38, "total_tokens": 63383568} +{"current_steps": 109340, "total_steps": 119360, "loss": 0.4294, "lr": 2.1318110845553686e-07, "epoch": 18.321045576407506, "percentage": 91.61, "elapsed_time": "4:19:13", "remaining_time": "0:23:45", "throughput": 4075.4, "total_tokens": 63386544} +{"current_steps": 109345, "total_steps": 119360, "loss": 0.3538, "lr": 2.1296995001274746e-07, "epoch": 18.321883378016086, "percentage": 91.61, "elapsed_time": "4:19:14", "remaining_time": "0:23:44", "throughput": 4075.41, "total_tokens": 63389360} +{"current_steps": 109350, "total_steps": 119360, "loss": 0.3407, "lr": 2.1275889392359307e-07, "epoch": 18.322721179624665, "percentage": 91.61, "elapsed_time": "4:19:14", "remaining_time": "0:23:43", "throughput": 4075.42, "total_tokens": 63392304} +{"current_steps": 109355, "total_steps": 119360, "loss": 0.324, "lr": 2.1254794019258562e-07, "epoch": 18.323558981233244, "percentage": 91.62, "elapsed_time": "4:19:15", "remaining_time": "0:23:43", "throughput": 4075.42, "total_tokens": 63395120} +{"current_steps": 109360, "total_steps": 119360, "loss": 0.3362, "lr": 2.12337088824236e-07, "epoch": 18.324396782841823, "percentage": 91.62, "elapsed_time": "4:19:16", "remaining_time": "0:23:42", "throughput": 4075.43, "total_tokens": 63397968} +{"current_steps": 109365, "total_steps": 119360, "loss": 0.2139, "lr": 2.1212633982305052e-07, "epoch": 18.325234584450403, "percentage": 91.63, "elapsed_time": "4:19:16", "remaining_time": "0:23:41", "throughput": 4075.45, "total_tokens": 63401040} +{"current_steps": 109370, "total_steps": 119360, "loss": 0.2358, "lr": 2.1191569319353898e-07, "epoch": 18.326072386058982, "percentage": 91.63, "elapsed_time": "4:19:17", "remaining_time": "0:23:41", "throughput": 4075.45, "total_tokens": 63403760} +{"current_steps": 109375, "total_steps": 119360, "loss": 0.2576, "lr": 2.1170514894020221e-07, "epoch": 18.32691018766756, "percentage": 91.63, "elapsed_time": "4:19:18", "remaining_time": "0:23:40", "throughput": 4075.45, "total_tokens": 63406416} +{"current_steps": 109380, "total_steps": 119360, "loss": 0.1964, "lr": 2.1149470706754328e-07, "epoch": 18.32774798927614, "percentage": 91.64, "elapsed_time": "4:19:18", "remaining_time": "0:23:39", "throughput": 4075.46, "total_tokens": 63409104} +{"current_steps": 109385, "total_steps": 119360, "loss": 0.5293, "lr": 2.1128436758006133e-07, "epoch": 18.32858579088472, "percentage": 91.64, "elapsed_time": "4:19:19", "remaining_time": "0:23:38", "throughput": 4075.48, "total_tokens": 63412368} +{"current_steps": 109390, "total_steps": 119360, "loss": 0.3066, "lr": 2.110741304822539e-07, "epoch": 18.3294235924933, "percentage": 91.65, "elapsed_time": "4:19:20", "remaining_time": "0:23:38", "throughput": 4075.5, "total_tokens": 63415504} +{"current_steps": 109395, "total_steps": 119360, "loss": 0.1402, "lr": 2.1086399577861628e-07, "epoch": 18.33026139410188, "percentage": 91.65, "elapsed_time": "4:19:20", "remaining_time": "0:23:37", "throughput": 4075.51, "total_tokens": 63418448} +{"current_steps": 109400, "total_steps": 119360, "loss": 0.315, "lr": 2.1065396347364153e-07, "epoch": 18.331099195710454, "percentage": 91.66, "elapsed_time": "4:19:21", "remaining_time": "0:23:36", "throughput": 4075.52, "total_tokens": 63421488} +{"current_steps": 109405, "total_steps": 119360, "loss": 0.2198, "lr": 2.104440335718194e-07, "epoch": 18.331936997319033, "percentage": 91.66, "elapsed_time": "4:19:22", "remaining_time": "0:23:36", "throughput": 4075.53, "total_tokens": 63424720} +{"current_steps": 109410, "total_steps": 119360, "loss": 0.2298, "lr": 2.1023420607763966e-07, "epoch": 18.332774798927613, "percentage": 91.66, "elapsed_time": "4:19:23", "remaining_time": "0:23:35", "throughput": 4075.54, "total_tokens": 63427696} +{"current_steps": 109415, "total_steps": 119360, "loss": 0.349, "lr": 2.1002448099558926e-07, "epoch": 18.333612600536192, "percentage": 91.67, "elapsed_time": "4:19:23", "remaining_time": "0:23:34", "throughput": 4075.55, "total_tokens": 63430576} +{"current_steps": 109420, "total_steps": 119360, "loss": 0.2697, "lr": 2.098148583301507e-07, "epoch": 18.33445040214477, "percentage": 91.67, "elapsed_time": "4:19:24", "remaining_time": "0:23:33", "throughput": 4075.56, "total_tokens": 63433712} +{"current_steps": 109425, "total_steps": 119360, "loss": 0.1851, "lr": 2.0960533808580596e-07, "epoch": 18.33528820375335, "percentage": 91.68, "elapsed_time": "4:19:25", "remaining_time": "0:23:33", "throughput": 4075.57, "total_tokens": 63436496} +{"current_steps": 109430, "total_steps": 119360, "loss": 0.4922, "lr": 2.093959202670376e-07, "epoch": 18.33612600536193, "percentage": 91.68, "elapsed_time": "4:19:25", "remaining_time": "0:23:32", "throughput": 4075.59, "total_tokens": 63439504} +{"current_steps": 109435, "total_steps": 119360, "loss": 0.3808, "lr": 2.0918660487832033e-07, "epoch": 18.33696380697051, "percentage": 91.68, "elapsed_time": "4:19:26", "remaining_time": "0:23:31", "throughput": 4075.6, "total_tokens": 63442352} +{"current_steps": 109440, "total_steps": 119360, "loss": 0.209, "lr": 2.0897739192413112e-07, "epoch": 18.33780160857909, "percentage": 91.69, "elapsed_time": "4:19:27", "remaining_time": "0:23:31", "throughput": 4075.61, "total_tokens": 63445424} +{"current_steps": 109445, "total_steps": 119360, "loss": 0.1833, "lr": 2.087682814089431e-07, "epoch": 18.338639410187668, "percentage": 91.69, "elapsed_time": "4:19:27", "remaining_time": "0:23:30", "throughput": 4075.62, "total_tokens": 63448080} +{"current_steps": 109450, "total_steps": 119360, "loss": 0.5441, "lr": 2.085592733372266e-07, "epoch": 18.339477211796247, "percentage": 91.7, "elapsed_time": "4:19:28", "remaining_time": "0:23:29", "throughput": 4075.63, "total_tokens": 63451056} +{"current_steps": 109455, "total_steps": 119360, "loss": 0.1829, "lr": 2.083503677134513e-07, "epoch": 18.340315013404826, "percentage": 91.7, "elapsed_time": "4:19:29", "remaining_time": "0:23:28", "throughput": 4075.64, "total_tokens": 63454000} +{"current_steps": 109460, "total_steps": 119360, "loss": 0.3538, "lr": 2.0814156454208422e-07, "epoch": 18.341152815013405, "percentage": 91.71, "elapsed_time": "4:19:29", "remaining_time": "0:23:28", "throughput": 4075.65, "total_tokens": 63456784} +{"current_steps": 109465, "total_steps": 119360, "loss": 0.4175, "lr": 2.0793286382758903e-07, "epoch": 18.341990616621985, "percentage": 91.71, "elapsed_time": "4:19:30", "remaining_time": "0:23:27", "throughput": 4075.65, "total_tokens": 63459760} +{"current_steps": 109470, "total_steps": 119360, "loss": 0.4956, "lr": 2.0772426557442714e-07, "epoch": 18.342828418230564, "percentage": 91.71, "elapsed_time": "4:19:31", "remaining_time": "0:23:26", "throughput": 4075.66, "total_tokens": 63462608} +{"current_steps": 109475, "total_steps": 119360, "loss": 0.3667, "lr": 2.0751576978706166e-07, "epoch": 18.343666219839143, "percentage": 91.72, "elapsed_time": "4:19:31", "remaining_time": "0:23:26", "throughput": 4075.66, "total_tokens": 63465104} +{"current_steps": 109480, "total_steps": 119360, "loss": 0.3204, "lr": 2.0730737646994791e-07, "epoch": 18.344504021447722, "percentage": 91.72, "elapsed_time": "4:19:32", "remaining_time": "0:23:25", "throughput": 4075.67, "total_tokens": 63467760} +{"current_steps": 109485, "total_steps": 119360, "loss": 0.4651, "lr": 2.0709908562754232e-07, "epoch": 18.3453418230563, "percentage": 91.73, "elapsed_time": "4:19:33", "remaining_time": "0:23:24", "throughput": 4075.67, "total_tokens": 63470576} +{"current_steps": 109490, "total_steps": 119360, "loss": 0.3952, "lr": 2.0689089726429857e-07, "epoch": 18.34617962466488, "percentage": 91.73, "elapsed_time": "4:19:33", "remaining_time": "0:23:23", "throughput": 4075.68, "total_tokens": 63473968} +{"current_steps": 109495, "total_steps": 119360, "loss": 0.2528, "lr": 2.0668281138466805e-07, "epoch": 18.34701742627346, "percentage": 91.74, "elapsed_time": "4:19:34", "remaining_time": "0:23:23", "throughput": 4075.7, "total_tokens": 63476880} +{"current_steps": 109500, "total_steps": 119360, "loss": 0.1845, "lr": 2.0647482799310003e-07, "epoch": 18.347855227882036, "percentage": 91.74, "elapsed_time": "4:19:35", "remaining_time": "0:23:22", "throughput": 4075.7, "total_tokens": 63479440} +{"current_steps": 109505, "total_steps": 119360, "loss": 0.5574, "lr": 2.062669470940426e-07, "epoch": 18.348693029490615, "percentage": 91.74, "elapsed_time": "4:19:35", "remaining_time": "0:23:21", "throughput": 4075.7, "total_tokens": 63482128} +{"current_steps": 109510, "total_steps": 119360, "loss": 0.2187, "lr": 2.060591686919372e-07, "epoch": 18.349530831099194, "percentage": 91.75, "elapsed_time": "4:19:36", "remaining_time": "0:23:21", "throughput": 4075.72, "total_tokens": 63485136} +{"current_steps": 109515, "total_steps": 119360, "loss": 0.4238, "lr": 2.0585149279122972e-07, "epoch": 18.350368632707774, "percentage": 91.75, "elapsed_time": "4:19:37", "remaining_time": "0:23:20", "throughput": 4075.72, "total_tokens": 63487760} +{"current_steps": 109520, "total_steps": 119360, "loss": 0.5205, "lr": 2.0564391939635997e-07, "epoch": 18.351206434316353, "percentage": 91.76, "elapsed_time": "4:19:37", "remaining_time": "0:23:19", "throughput": 4075.73, "total_tokens": 63490448} +{"current_steps": 109525, "total_steps": 119360, "loss": 0.2465, "lr": 2.0543644851176547e-07, "epoch": 18.352044235924932, "percentage": 91.76, "elapsed_time": "4:19:38", "remaining_time": "0:23:18", "throughput": 4075.74, "total_tokens": 63493296} +{"current_steps": 109530, "total_steps": 119360, "loss": 0.3228, "lr": 2.0522908014188103e-07, "epoch": 18.35288203753351, "percentage": 91.76, "elapsed_time": "4:19:39", "remaining_time": "0:23:18", "throughput": 4075.75, "total_tokens": 63496080} +{"current_steps": 109535, "total_steps": 119360, "loss": 0.3629, "lr": 2.0502181429114365e-07, "epoch": 18.35371983914209, "percentage": 91.77, "elapsed_time": "4:19:39", "remaining_time": "0:23:17", "throughput": 4075.76, "total_tokens": 63499024} +{"current_steps": 109540, "total_steps": 119360, "loss": 0.3436, "lr": 2.0481465096398257e-07, "epoch": 18.35455764075067, "percentage": 91.77, "elapsed_time": "4:19:40", "remaining_time": "0:23:16", "throughput": 4075.77, "total_tokens": 63502032} +{"current_steps": 109545, "total_steps": 119360, "loss": 0.3812, "lr": 2.046075901648281e-07, "epoch": 18.35539544235925, "percentage": 91.78, "elapsed_time": "4:19:41", "remaining_time": "0:23:16", "throughput": 4075.78, "total_tokens": 63505072} +{"current_steps": 109550, "total_steps": 119360, "loss": 0.3658, "lr": 2.0440063189810677e-07, "epoch": 18.35623324396783, "percentage": 91.78, "elapsed_time": "4:19:41", "remaining_time": "0:23:15", "throughput": 4075.79, "total_tokens": 63507888} +{"current_steps": 109555, "total_steps": 119360, "loss": 0.5106, "lr": 2.0419377616824442e-07, "epoch": 18.357071045576408, "percentage": 91.79, "elapsed_time": "4:19:42", "remaining_time": "0:23:14", "throughput": 4075.8, "total_tokens": 63510800} +{"current_steps": 109560, "total_steps": 119360, "loss": 0.1052, "lr": 2.0398702297966365e-07, "epoch": 18.357908847184987, "percentage": 91.79, "elapsed_time": "4:19:43", "remaining_time": "0:23:13", "throughput": 4075.81, "total_tokens": 63513648} +{"current_steps": 109565, "total_steps": 119360, "loss": 0.2691, "lr": 2.0378037233678593e-07, "epoch": 18.358746648793566, "percentage": 91.79, "elapsed_time": "4:19:43", "remaining_time": "0:23:13", "throughput": 4075.82, "total_tokens": 63516336} +{"current_steps": 109570, "total_steps": 119360, "loss": 0.4437, "lr": 2.0357382424402772e-07, "epoch": 18.359584450402146, "percentage": 91.8, "elapsed_time": "4:19:44", "remaining_time": "0:23:12", "throughput": 4075.83, "total_tokens": 63519184} +{"current_steps": 109575, "total_steps": 119360, "loss": 0.3573, "lr": 2.0336737870580658e-07, "epoch": 18.360422252010725, "percentage": 91.8, "elapsed_time": "4:19:45", "remaining_time": "0:23:11", "throughput": 4075.84, "total_tokens": 63522224} +{"current_steps": 109580, "total_steps": 119360, "loss": 0.4098, "lr": 2.031610357265379e-07, "epoch": 18.361260053619304, "percentage": 91.81, "elapsed_time": "4:19:45", "remaining_time": "0:23:11", "throughput": 4075.86, "total_tokens": 63525168} +{"current_steps": 109585, "total_steps": 119360, "loss": 0.2077, "lr": 2.0295479531063144e-07, "epoch": 18.362097855227884, "percentage": 91.81, "elapsed_time": "4:19:46", "remaining_time": "0:23:10", "throughput": 4075.87, "total_tokens": 63528304} +{"current_steps": 109590, "total_steps": 119360, "loss": 0.2295, "lr": 2.027486574624976e-07, "epoch": 18.362935656836463, "percentage": 91.81, "elapsed_time": "4:19:47", "remaining_time": "0:23:09", "throughput": 4075.88, "total_tokens": 63531472} +{"current_steps": 109595, "total_steps": 119360, "loss": 0.3614, "lr": 2.0254262218654452e-07, "epoch": 18.36377345844504, "percentage": 91.82, "elapsed_time": "4:19:47", "remaining_time": "0:23:08", "throughput": 4075.89, "total_tokens": 63534288} +{"current_steps": 109600, "total_steps": 119360, "loss": 0.1004, "lr": 2.0233668948717699e-07, "epoch": 18.364611260053618, "percentage": 91.82, "elapsed_time": "4:19:48", "remaining_time": "0:23:08", "throughput": 4075.9, "total_tokens": 63537040} +{"current_steps": 109605, "total_steps": 119360, "loss": 0.2633, "lr": 2.0213085936879816e-07, "epoch": 18.365449061662197, "percentage": 91.83, "elapsed_time": "4:19:49", "remaining_time": "0:23:07", "throughput": 4075.9, "total_tokens": 63539536} +{"current_steps": 109610, "total_steps": 119360, "loss": 0.1165, "lr": 2.0192513183580952e-07, "epoch": 18.366286863270776, "percentage": 91.83, "elapsed_time": "4:19:49", "remaining_time": "0:23:06", "throughput": 4075.9, "total_tokens": 63542256} +{"current_steps": 109615, "total_steps": 119360, "loss": 0.2593, "lr": 2.0171950689260866e-07, "epoch": 18.367124664879356, "percentage": 91.84, "elapsed_time": "4:19:50", "remaining_time": "0:23:06", "throughput": 4075.91, "total_tokens": 63545136} +{"current_steps": 109620, "total_steps": 119360, "loss": 0.4945, "lr": 2.0151398454359317e-07, "epoch": 18.367962466487935, "percentage": 91.84, "elapsed_time": "4:19:51", "remaining_time": "0:23:05", "throughput": 4075.92, "total_tokens": 63547888} +{"current_steps": 109625, "total_steps": 119360, "loss": 0.2874, "lr": 2.0130856479315787e-07, "epoch": 18.368800268096514, "percentage": 91.84, "elapsed_time": "4:19:51", "remaining_time": "0:23:04", "throughput": 4075.93, "total_tokens": 63551024} +{"current_steps": 109630, "total_steps": 119360, "loss": 0.3821, "lr": 2.0110324764569255e-07, "epoch": 18.369638069705093, "percentage": 91.85, "elapsed_time": "4:19:52", "remaining_time": "0:23:03", "throughput": 4075.94, "total_tokens": 63554000} +{"current_steps": 109635, "total_steps": 119360, "loss": 0.3323, "lr": 2.0089803310558987e-07, "epoch": 18.370475871313673, "percentage": 91.85, "elapsed_time": "4:19:53", "remaining_time": "0:23:03", "throughput": 4075.96, "total_tokens": 63556944} +{"current_steps": 109640, "total_steps": 119360, "loss": 0.4217, "lr": 2.0069292117723681e-07, "epoch": 18.371313672922252, "percentage": 91.86, "elapsed_time": "4:19:53", "remaining_time": "0:23:02", "throughput": 4075.97, "total_tokens": 63559888} +{"current_steps": 109645, "total_steps": 119360, "loss": 0.3166, "lr": 2.0048791186501825e-07, "epoch": 18.37215147453083, "percentage": 91.86, "elapsed_time": "4:19:54", "remaining_time": "0:23:01", "throughput": 4075.98, "total_tokens": 63562768} +{"current_steps": 109650, "total_steps": 119360, "loss": 0.1897, "lr": 2.0028300517331844e-07, "epoch": 18.37298927613941, "percentage": 91.86, "elapsed_time": "4:19:55", "remaining_time": "0:23:01", "throughput": 4075.98, "total_tokens": 63565552} +{"current_steps": 109655, "total_steps": 119360, "loss": 0.338, "lr": 2.0007820110651777e-07, "epoch": 18.37382707774799, "percentage": 91.87, "elapsed_time": "4:19:55", "remaining_time": "0:23:00", "throughput": 4075.99, "total_tokens": 63568464} +{"current_steps": 109660, "total_steps": 119360, "loss": 0.3521, "lr": 1.998734996689955e-07, "epoch": 18.37466487935657, "percentage": 91.87, "elapsed_time": "4:19:56", "remaining_time": "0:22:59", "throughput": 4076.0, "total_tokens": 63571088} +{"current_steps": 109665, "total_steps": 119360, "loss": 0.5774, "lr": 1.996689008651287e-07, "epoch": 18.37550268096515, "percentage": 91.88, "elapsed_time": "4:19:57", "remaining_time": "0:22:58", "throughput": 4076.01, "total_tokens": 63574000} +{"current_steps": 109670, "total_steps": 119360, "loss": 0.3681, "lr": 1.9946440469929275e-07, "epoch": 18.376340482573728, "percentage": 91.88, "elapsed_time": "4:19:57", "remaining_time": "0:22:58", "throughput": 4076.02, "total_tokens": 63577040} +{"current_steps": 109675, "total_steps": 119360, "loss": 0.3427, "lr": 1.9926001117585747e-07, "epoch": 18.377178284182307, "percentage": 91.89, "elapsed_time": "4:19:58", "remaining_time": "0:22:57", "throughput": 4076.03, "total_tokens": 63579888} +{"current_steps": 109680, "total_steps": 119360, "loss": 0.5033, "lr": 1.9905572029919607e-07, "epoch": 18.378016085790886, "percentage": 91.89, "elapsed_time": "4:19:59", "remaining_time": "0:22:56", "throughput": 4076.03, "total_tokens": 63582352} +{"current_steps": 109685, "total_steps": 119360, "loss": 0.2744, "lr": 1.9885153207367557e-07, "epoch": 18.378853887399465, "percentage": 91.89, "elapsed_time": "4:19:59", "remaining_time": "0:22:56", "throughput": 4076.03, "total_tokens": 63585200} +{"current_steps": 109690, "total_steps": 119360, "loss": 0.2397, "lr": 1.9864744650366085e-07, "epoch": 18.379691689008045, "percentage": 91.9, "elapsed_time": "4:20:00", "remaining_time": "0:22:55", "throughput": 4076.04, "total_tokens": 63588080} +{"current_steps": 109695, "total_steps": 119360, "loss": 0.5861, "lr": 1.9844346359351618e-07, "epoch": 18.38052949061662, "percentage": 91.9, "elapsed_time": "4:20:01", "remaining_time": "0:22:54", "throughput": 4076.05, "total_tokens": 63590768} +{"current_steps": 109700, "total_steps": 119360, "loss": 0.3801, "lr": 1.9823958334760364e-07, "epoch": 18.3813672922252, "percentage": 91.91, "elapsed_time": "4:20:01", "remaining_time": "0:22:53", "throughput": 4076.06, "total_tokens": 63593488} +{"current_steps": 109705, "total_steps": 119360, "loss": 0.2285, "lr": 1.980358057702819e-07, "epoch": 18.38220509383378, "percentage": 91.91, "elapsed_time": "4:20:02", "remaining_time": "0:22:53", "throughput": 4076.06, "total_tokens": 63596240} +{"current_steps": 109710, "total_steps": 119360, "loss": 0.1276, "lr": 1.9783213086590814e-07, "epoch": 18.383042895442358, "percentage": 91.92, "elapsed_time": "4:20:03", "remaining_time": "0:22:52", "throughput": 4076.08, "total_tokens": 63599280} +{"current_steps": 109715, "total_steps": 119360, "loss": 0.5262, "lr": 1.9762855863883658e-07, "epoch": 18.383880697050937, "percentage": 91.92, "elapsed_time": "4:20:03", "remaining_time": "0:22:51", "throughput": 4076.08, "total_tokens": 63601936} +{"current_steps": 109720, "total_steps": 119360, "loss": 0.3563, "lr": 1.9742508909342095e-07, "epoch": 18.384718498659517, "percentage": 91.92, "elapsed_time": "4:20:04", "remaining_time": "0:22:51", "throughput": 4076.09, "total_tokens": 63604848} +{"current_steps": 109725, "total_steps": 119360, "loss": 0.2266, "lr": 1.9722172223401116e-07, "epoch": 18.385556300268096, "percentage": 91.93, "elapsed_time": "4:20:05", "remaining_time": "0:22:50", "throughput": 4076.1, "total_tokens": 63607504} +{"current_steps": 109730, "total_steps": 119360, "loss": 0.1179, "lr": 1.9701845806495646e-07, "epoch": 18.386394101876675, "percentage": 91.93, "elapsed_time": "4:20:05", "remaining_time": "0:22:49", "throughput": 4076.1, "total_tokens": 63610384} +{"current_steps": 109735, "total_steps": 119360, "loss": 0.408, "lr": 1.9681529659060007e-07, "epoch": 18.387231903485254, "percentage": 91.94, "elapsed_time": "4:20:06", "remaining_time": "0:22:48", "throughput": 4076.12, "total_tokens": 63613360} +{"current_steps": 109740, "total_steps": 119360, "loss": 0.4922, "lr": 1.9661223781528904e-07, "epoch": 18.388069705093834, "percentage": 91.94, "elapsed_time": "4:20:07", "remaining_time": "0:22:48", "throughput": 4076.12, "total_tokens": 63616048} +{"current_steps": 109745, "total_steps": 119360, "loss": 0.4325, "lr": 1.9640928174336438e-07, "epoch": 18.388907506702413, "percentage": 91.94, "elapsed_time": "4:20:07", "remaining_time": "0:22:47", "throughput": 4076.13, "total_tokens": 63618960} +{"current_steps": 109750, "total_steps": 119360, "loss": 0.4687, "lr": 1.9620642837916482e-07, "epoch": 18.389745308310992, "percentage": 91.95, "elapsed_time": "4:20:08", "remaining_time": "0:22:46", "throughput": 4076.15, "total_tokens": 63622128} +{"current_steps": 109755, "total_steps": 119360, "loss": 0.1825, "lr": 1.9600367772702689e-07, "epoch": 18.39058310991957, "percentage": 91.95, "elapsed_time": "4:20:09", "remaining_time": "0:22:45", "throughput": 4076.16, "total_tokens": 63624848} +{"current_steps": 109760, "total_steps": 119360, "loss": 0.4327, "lr": 1.9580102979128822e-07, "epoch": 18.39142091152815, "percentage": 91.96, "elapsed_time": "4:20:09", "remaining_time": "0:22:45", "throughput": 4076.17, "total_tokens": 63627568} +{"current_steps": 109765, "total_steps": 119360, "loss": 0.5012, "lr": 1.9559848457627927e-07, "epoch": 18.39225871313673, "percentage": 91.96, "elapsed_time": "4:20:10", "remaining_time": "0:22:44", "throughput": 4076.18, "total_tokens": 63630640} +{"current_steps": 109770, "total_steps": 119360, "loss": 0.4145, "lr": 1.9539604208633212e-07, "epoch": 18.39309651474531, "percentage": 91.97, "elapsed_time": "4:20:11", "remaining_time": "0:22:43", "throughput": 4076.19, "total_tokens": 63633648} +{"current_steps": 109775, "total_steps": 119360, "loss": 0.5142, "lr": 1.951937023257744e-07, "epoch": 18.39393431635389, "percentage": 91.97, "elapsed_time": "4:20:11", "remaining_time": "0:22:43", "throughput": 4076.2, "total_tokens": 63636528} +{"current_steps": 109780, "total_steps": 119360, "loss": 0.2834, "lr": 1.949914652989332e-07, "epoch": 18.394772117962468, "percentage": 91.97, "elapsed_time": "4:20:12", "remaining_time": "0:22:42", "throughput": 4076.21, "total_tokens": 63639152} +{"current_steps": 109785, "total_steps": 119360, "loss": 0.2552, "lr": 1.947893310101323e-07, "epoch": 18.395609919571047, "percentage": 91.98, "elapsed_time": "4:20:13", "remaining_time": "0:22:41", "throughput": 4076.21, "total_tokens": 63642000} +{"current_steps": 109790, "total_steps": 119360, "loss": 0.1637, "lr": 1.945872994636938e-07, "epoch": 18.396447721179626, "percentage": 91.98, "elapsed_time": "4:20:13", "remaining_time": "0:22:40", "throughput": 4076.23, "total_tokens": 63645104} +{"current_steps": 109795, "total_steps": 119360, "loss": 0.3542, "lr": 1.9438537066393647e-07, "epoch": 18.397285522788202, "percentage": 91.99, "elapsed_time": "4:20:14", "remaining_time": "0:22:40", "throughput": 4076.24, "total_tokens": 63648368} +{"current_steps": 109800, "total_steps": 119360, "loss": 0.4282, "lr": 1.9418354461517962e-07, "epoch": 18.39812332439678, "percentage": 91.99, "elapsed_time": "4:20:15", "remaining_time": "0:22:39", "throughput": 4076.25, "total_tokens": 63651120} +{"current_steps": 109805, "total_steps": 119360, "loss": 0.3448, "lr": 1.9398182132173759e-07, "epoch": 18.39896112600536, "percentage": 91.99, "elapsed_time": "4:20:15", "remaining_time": "0:22:38", "throughput": 4076.26, "total_tokens": 63653904} +{"current_steps": 109810, "total_steps": 119360, "loss": 0.1638, "lr": 1.9378020078792303e-07, "epoch": 18.39979892761394, "percentage": 92.0, "elapsed_time": "4:20:16", "remaining_time": "0:22:38", "throughput": 4076.27, "total_tokens": 63656944} +{"current_steps": 109815, "total_steps": 119360, "loss": 0.435, "lr": 1.9357868301804805e-07, "epoch": 18.40063672922252, "percentage": 92.0, "elapsed_time": "4:20:17", "remaining_time": "0:22:37", "throughput": 4076.28, "total_tokens": 63659696} +{"current_steps": 109820, "total_steps": 119360, "loss": 0.3947, "lr": 1.9337726801641975e-07, "epoch": 18.4014745308311, "percentage": 92.01, "elapsed_time": "4:20:17", "remaining_time": "0:22:36", "throughput": 4076.29, "total_tokens": 63662608} +{"current_steps": 109825, "total_steps": 119360, "loss": 0.1782, "lr": 1.9317595578734638e-07, "epoch": 18.402312332439678, "percentage": 92.01, "elapsed_time": "4:20:18", "remaining_time": "0:22:35", "throughput": 4076.3, "total_tokens": 63665456} +{"current_steps": 109830, "total_steps": 119360, "loss": 0.3127, "lr": 1.9297474633513112e-07, "epoch": 18.403150134048257, "percentage": 92.02, "elapsed_time": "4:20:19", "remaining_time": "0:22:35", "throughput": 4076.31, "total_tokens": 63668432} +{"current_steps": 109835, "total_steps": 119360, "loss": 0.4161, "lr": 1.9277363966407782e-07, "epoch": 18.403987935656836, "percentage": 92.02, "elapsed_time": "4:20:19", "remaining_time": "0:22:34", "throughput": 4076.32, "total_tokens": 63671088} +{"current_steps": 109840, "total_steps": 119360, "loss": 0.2934, "lr": 1.925726357784835e-07, "epoch": 18.404825737265416, "percentage": 92.02, "elapsed_time": "4:20:20", "remaining_time": "0:22:33", "throughput": 4076.33, "total_tokens": 63674032} +{"current_steps": 109845, "total_steps": 119360, "loss": 0.4969, "lr": 1.9237173468264814e-07, "epoch": 18.405663538873995, "percentage": 92.03, "elapsed_time": "4:20:21", "remaining_time": "0:22:33", "throughput": 4076.34, "total_tokens": 63676752} +{"current_steps": 109850, "total_steps": 119360, "loss": 0.1446, "lr": 1.9217093638086713e-07, "epoch": 18.406501340482574, "percentage": 92.03, "elapsed_time": "4:20:21", "remaining_time": "0:22:32", "throughput": 4076.35, "total_tokens": 63679696} +{"current_steps": 109855, "total_steps": 119360, "loss": 0.3117, "lr": 1.919702408774332e-07, "epoch": 18.407339142091153, "percentage": 92.04, "elapsed_time": "4:20:22", "remaining_time": "0:22:31", "throughput": 4076.36, "total_tokens": 63682864} +{"current_steps": 109860, "total_steps": 119360, "loss": 0.3571, "lr": 1.9176964817663734e-07, "epoch": 18.408176943699733, "percentage": 92.04, "elapsed_time": "4:20:23", "remaining_time": "0:22:30", "throughput": 4076.37, "total_tokens": 63685552} +{"current_steps": 109865, "total_steps": 119360, "loss": 0.5437, "lr": 1.9156915828277002e-07, "epoch": 18.409014745308312, "percentage": 92.05, "elapsed_time": "4:20:23", "remaining_time": "0:22:30", "throughput": 4076.38, "total_tokens": 63688304} +{"current_steps": 109870, "total_steps": 119360, "loss": 0.2894, "lr": 1.913687712001161e-07, "epoch": 18.40985254691689, "percentage": 92.05, "elapsed_time": "4:20:24", "remaining_time": "0:22:29", "throughput": 4076.39, "total_tokens": 63691408} +{"current_steps": 109875, "total_steps": 119360, "loss": 0.2354, "lr": 1.9116848693296108e-07, "epoch": 18.41069034852547, "percentage": 92.05, "elapsed_time": "4:20:25", "remaining_time": "0:22:28", "throughput": 4076.39, "total_tokens": 63693968} +{"current_steps": 109880, "total_steps": 119360, "loss": 0.5281, "lr": 1.909683054855871e-07, "epoch": 18.41152815013405, "percentage": 92.06, "elapsed_time": "4:20:25", "remaining_time": "0:22:28", "throughput": 4076.39, "total_tokens": 63696496} +{"current_steps": 109885, "total_steps": 119360, "loss": 0.4793, "lr": 1.907682268622746e-07, "epoch": 18.41236595174263, "percentage": 92.06, "elapsed_time": "4:20:26", "remaining_time": "0:22:27", "throughput": 4076.41, "total_tokens": 63699824} +{"current_steps": 109890, "total_steps": 119360, "loss": 0.2513, "lr": 1.9056825106730127e-07, "epoch": 18.413203753351205, "percentage": 92.07, "elapsed_time": "4:20:27", "remaining_time": "0:22:26", "throughput": 4076.42, "total_tokens": 63702608} +{"current_steps": 109895, "total_steps": 119360, "loss": 0.3701, "lr": 1.9036837810494367e-07, "epoch": 18.414041554959784, "percentage": 92.07, "elapsed_time": "4:20:27", "remaining_time": "0:22:25", "throughput": 4076.43, "total_tokens": 63705584} +{"current_steps": 109900, "total_steps": 119360, "loss": 0.3405, "lr": 1.9016860797947345e-07, "epoch": 18.414879356568363, "percentage": 92.07, "elapsed_time": "4:20:28", "remaining_time": "0:22:25", "throughput": 4076.44, "total_tokens": 63708400} +{"current_steps": 109905, "total_steps": 119360, "loss": 0.4537, "lr": 1.899689406951638e-07, "epoch": 18.415717158176943, "percentage": 92.08, "elapsed_time": "4:20:29", "remaining_time": "0:22:24", "throughput": 4076.45, "total_tokens": 63711408} +{"current_steps": 109910, "total_steps": 119360, "loss": 0.4086, "lr": 1.8976937625628355e-07, "epoch": 18.416554959785522, "percentage": 92.08, "elapsed_time": "4:20:29", "remaining_time": "0:22:23", "throughput": 4076.46, "total_tokens": 63714160} +{"current_steps": 109915, "total_steps": 119360, "loss": 0.2049, "lr": 1.8956991466709928e-07, "epoch": 18.4173927613941, "percentage": 92.09, "elapsed_time": "4:20:30", "remaining_time": "0:22:23", "throughput": 4076.47, "total_tokens": 63717040} +{"current_steps": 109920, "total_steps": 119360, "loss": 0.6192, "lr": 1.8937055593187593e-07, "epoch": 18.41823056300268, "percentage": 92.09, "elapsed_time": "4:20:31", "remaining_time": "0:22:22", "throughput": 4076.47, "total_tokens": 63719824} +{"current_steps": 109925, "total_steps": 119360, "loss": 0.2979, "lr": 1.8917130005487616e-07, "epoch": 18.41906836461126, "percentage": 92.1, "elapsed_time": "4:20:31", "remaining_time": "0:22:21", "throughput": 4076.48, "total_tokens": 63722448} +{"current_steps": 109930, "total_steps": 119360, "loss": 0.3592, "lr": 1.889721470403605e-07, "epoch": 18.41990616621984, "percentage": 92.1, "elapsed_time": "4:20:32", "remaining_time": "0:22:20", "throughput": 4076.49, "total_tokens": 63725232} +{"current_steps": 109935, "total_steps": 119360, "loss": 0.3092, "lr": 1.8877309689258661e-07, "epoch": 18.420743967828418, "percentage": 92.1, "elapsed_time": "4:20:33", "remaining_time": "0:22:20", "throughput": 4076.5, "total_tokens": 63728144} +{"current_steps": 109940, "total_steps": 119360, "loss": 0.306, "lr": 1.8857414961581054e-07, "epoch": 18.421581769436997, "percentage": 92.11, "elapsed_time": "4:20:33", "remaining_time": "0:22:19", "throughput": 4076.51, "total_tokens": 63731088} +{"current_steps": 109945, "total_steps": 119360, "loss": 0.3353, "lr": 1.883753052142867e-07, "epoch": 18.422419571045577, "percentage": 92.11, "elapsed_time": "4:20:34", "remaining_time": "0:22:18", "throughput": 4076.53, "total_tokens": 63734192} +{"current_steps": 109950, "total_steps": 119360, "loss": 0.6317, "lr": 1.881765636922661e-07, "epoch": 18.423257372654156, "percentage": 92.12, "elapsed_time": "4:20:35", "remaining_time": "0:22:18", "throughput": 4076.54, "total_tokens": 63737136} +{"current_steps": 109955, "total_steps": 119360, "loss": 0.3323, "lr": 1.879779250539987e-07, "epoch": 18.424095174262735, "percentage": 92.12, "elapsed_time": "4:20:35", "remaining_time": "0:22:17", "throughput": 4076.54, "total_tokens": 63739984} +{"current_steps": 109960, "total_steps": 119360, "loss": 0.3483, "lr": 1.8777938930373052e-07, "epoch": 18.424932975871315, "percentage": 92.12, "elapsed_time": "4:20:36", "remaining_time": "0:22:16", "throughput": 4076.55, "total_tokens": 63742672} +{"current_steps": 109965, "total_steps": 119360, "loss": 0.4284, "lr": 1.8758095644570817e-07, "epoch": 18.425770777479894, "percentage": 92.13, "elapsed_time": "4:20:37", "remaining_time": "0:22:15", "throughput": 4076.55, "total_tokens": 63745360} +{"current_steps": 109970, "total_steps": 119360, "loss": 0.3118, "lr": 1.8738262648417327e-07, "epoch": 18.426608579088473, "percentage": 92.13, "elapsed_time": "4:20:37", "remaining_time": "0:22:15", "throughput": 4076.56, "total_tokens": 63748304} +{"current_steps": 109975, "total_steps": 119360, "loss": 0.2995, "lr": 1.871843994233663e-07, "epoch": 18.427446380697052, "percentage": 92.14, "elapsed_time": "4:20:38", "remaining_time": "0:22:14", "throughput": 4076.57, "total_tokens": 63751152} +{"current_steps": 109980, "total_steps": 119360, "loss": 0.3875, "lr": 1.8698627526752667e-07, "epoch": 18.42828418230563, "percentage": 92.14, "elapsed_time": "4:20:39", "remaining_time": "0:22:13", "throughput": 4076.58, "total_tokens": 63754096} +{"current_steps": 109985, "total_steps": 119360, "loss": 0.3013, "lr": 1.867882540208893e-07, "epoch": 18.42912198391421, "percentage": 92.15, "elapsed_time": "4:20:39", "remaining_time": "0:22:13", "throughput": 4076.6, "total_tokens": 63757456} +{"current_steps": 109990, "total_steps": 119360, "loss": 0.3233, "lr": 1.8659033568768914e-07, "epoch": 18.429959785522787, "percentage": 92.15, "elapsed_time": "4:20:40", "remaining_time": "0:22:12", "throughput": 4076.61, "total_tokens": 63760400} +{"current_steps": 109995, "total_steps": 119360, "loss": 0.4718, "lr": 1.8639252027215727e-07, "epoch": 18.430797587131366, "percentage": 92.15, "elapsed_time": "4:20:41", "remaining_time": "0:22:11", "throughput": 4076.61, "total_tokens": 63763120} +{"current_steps": 110000, "total_steps": 119360, "loss": 0.4462, "lr": 1.8619480777852418e-07, "epoch": 18.431635388739945, "percentage": 92.16, "elapsed_time": "4:20:41", "remaining_time": "0:22:10", "throughput": 4076.62, "total_tokens": 63765936} +{"current_steps": 110005, "total_steps": 119360, "loss": 0.5132, "lr": 1.8599719821101592e-07, "epoch": 18.432473190348524, "percentage": 92.16, "elapsed_time": "4:20:42", "remaining_time": "0:22:10", "throughput": 4076.63, "total_tokens": 63768880} +{"current_steps": 110010, "total_steps": 119360, "loss": 0.184, "lr": 1.8579969157385913e-07, "epoch": 18.433310991957104, "percentage": 92.17, "elapsed_time": "4:20:43", "remaining_time": "0:22:09", "throughput": 4076.64, "total_tokens": 63771728} +{"current_steps": 110015, "total_steps": 119360, "loss": 0.3605, "lr": 1.8560228787127654e-07, "epoch": 18.434148793565683, "percentage": 92.17, "elapsed_time": "4:20:43", "remaining_time": "0:22:08", "throughput": 4076.65, "total_tokens": 63774864} +{"current_steps": 110020, "total_steps": 119360, "loss": 0.3418, "lr": 1.8540498710748755e-07, "epoch": 18.434986595174262, "percentage": 92.17, "elapsed_time": "4:20:44", "remaining_time": "0:22:08", "throughput": 4076.66, "total_tokens": 63777712} +{"current_steps": 110025, "total_steps": 119360, "loss": 0.56, "lr": 1.8520778928671213e-07, "epoch": 18.43582439678284, "percentage": 92.18, "elapsed_time": "4:20:45", "remaining_time": "0:22:07", "throughput": 4076.66, "total_tokens": 63780368} +{"current_steps": 110030, "total_steps": 119360, "loss": 0.2793, "lr": 1.8501069441316577e-07, "epoch": 18.43666219839142, "percentage": 92.18, "elapsed_time": "4:20:46", "remaining_time": "0:22:06", "throughput": 4076.68, "total_tokens": 63783760} +{"current_steps": 110035, "total_steps": 119360, "loss": 0.4064, "lr": 1.8481370249106344e-07, "epoch": 18.4375, "percentage": 92.19, "elapsed_time": "4:20:46", "remaining_time": "0:22:05", "throughput": 4076.69, "total_tokens": 63786864} +{"current_steps": 110040, "total_steps": 119360, "loss": 0.2398, "lr": 1.846168135246168e-07, "epoch": 18.43833780160858, "percentage": 92.19, "elapsed_time": "4:20:47", "remaining_time": "0:22:05", "throughput": 4076.7, "total_tokens": 63789840} +{"current_steps": 110045, "total_steps": 119360, "loss": 0.4809, "lr": 1.8442002751803524e-07, "epoch": 18.43917560321716, "percentage": 92.2, "elapsed_time": "4:20:48", "remaining_time": "0:22:04", "throughput": 4076.7, "total_tokens": 63792624} +{"current_steps": 110050, "total_steps": 119360, "loss": 0.1845, "lr": 1.8422334447552647e-07, "epoch": 18.440013404825738, "percentage": 92.2, "elapsed_time": "4:20:48", "remaining_time": "0:22:03", "throughput": 4076.71, "total_tokens": 63795472} +{"current_steps": 110055, "total_steps": 119360, "loss": 0.1421, "lr": 1.8402676440129663e-07, "epoch": 18.440851206434317, "percentage": 92.2, "elapsed_time": "4:20:49", "remaining_time": "0:22:03", "throughput": 4076.73, "total_tokens": 63798352} +{"current_steps": 110060, "total_steps": 119360, "loss": 0.4824, "lr": 1.8383028729954845e-07, "epoch": 18.441689008042896, "percentage": 92.21, "elapsed_time": "4:20:50", "remaining_time": "0:22:02", "throughput": 4076.74, "total_tokens": 63801456} +{"current_steps": 110065, "total_steps": 119360, "loss": 0.3437, "lr": 1.8363391317448187e-07, "epoch": 18.442526809651476, "percentage": 92.21, "elapsed_time": "4:20:50", "remaining_time": "0:22:01", "throughput": 4076.75, "total_tokens": 63804272} +{"current_steps": 110070, "total_steps": 119360, "loss": 0.428, "lr": 1.8343764203029744e-07, "epoch": 18.443364611260055, "percentage": 92.22, "elapsed_time": "4:20:51", "remaining_time": "0:22:00", "throughput": 4076.75, "total_tokens": 63807088} +{"current_steps": 110075, "total_steps": 119360, "loss": 0.3004, "lr": 1.8324147387119074e-07, "epoch": 18.444202412868634, "percentage": 92.22, "elapsed_time": "4:20:52", "remaining_time": "0:22:00", "throughput": 4076.76, "total_tokens": 63809904} +{"current_steps": 110080, "total_steps": 119360, "loss": 0.3464, "lr": 1.8304540870135557e-07, "epoch": 18.445040214477213, "percentage": 92.23, "elapsed_time": "4:20:52", "remaining_time": "0:21:59", "throughput": 4076.77, "total_tokens": 63812688} +{"current_steps": 110085, "total_steps": 119360, "loss": 0.2945, "lr": 1.8284944652498525e-07, "epoch": 18.44587801608579, "percentage": 92.23, "elapsed_time": "4:20:53", "remaining_time": "0:21:58", "throughput": 4076.79, "total_tokens": 63815984} +{"current_steps": 110090, "total_steps": 119360, "loss": 0.3589, "lr": 1.826535873462687e-07, "epoch": 18.44671581769437, "percentage": 92.23, "elapsed_time": "4:20:54", "remaining_time": "0:21:58", "throughput": 4076.79, "total_tokens": 63818736} +{"current_steps": 110095, "total_steps": 119360, "loss": 0.2959, "lr": 1.8245783116939476e-07, "epoch": 18.447553619302948, "percentage": 92.24, "elapsed_time": "4:20:54", "remaining_time": "0:21:57", "throughput": 4076.8, "total_tokens": 63821552} +{"current_steps": 110100, "total_steps": 119360, "loss": 0.2704, "lr": 1.8226217799854785e-07, "epoch": 18.448391420911527, "percentage": 92.24, "elapsed_time": "4:20:55", "remaining_time": "0:21:56", "throughput": 4076.82, "total_tokens": 63824848} +{"current_steps": 110105, "total_steps": 119360, "loss": 0.3587, "lr": 1.820666278379124e-07, "epoch": 18.449229222520106, "percentage": 92.25, "elapsed_time": "4:20:56", "remaining_time": "0:21:56", "throughput": 4076.83, "total_tokens": 63827664} +{"current_steps": 110110, "total_steps": 119360, "loss": 0.5239, "lr": 1.8187118069166844e-07, "epoch": 18.450067024128685, "percentage": 92.25, "elapsed_time": "4:20:56", "remaining_time": "0:21:55", "throughput": 4076.84, "total_tokens": 63830576} +{"current_steps": 110115, "total_steps": 119360, "loss": 0.5194, "lr": 1.816758365639959e-07, "epoch": 18.450904825737265, "percentage": 92.25, "elapsed_time": "4:20:57", "remaining_time": "0:21:54", "throughput": 4076.85, "total_tokens": 63833616} +{"current_steps": 110120, "total_steps": 119360, "loss": 0.4046, "lr": 1.814805954590715e-07, "epoch": 18.451742627345844, "percentage": 92.26, "elapsed_time": "4:20:58", "remaining_time": "0:21:53", "throughput": 4076.86, "total_tokens": 63836528} +{"current_steps": 110125, "total_steps": 119360, "loss": 0.4107, "lr": 1.8128545738106852e-07, "epoch": 18.452580428954423, "percentage": 92.26, "elapsed_time": "4:20:58", "remaining_time": "0:21:53", "throughput": 4076.88, "total_tokens": 63839664} +{"current_steps": 110130, "total_steps": 119360, "loss": 0.4788, "lr": 1.8109042233416086e-07, "epoch": 18.453418230563003, "percentage": 92.27, "elapsed_time": "4:20:59", "remaining_time": "0:21:52", "throughput": 4076.88, "total_tokens": 63842384} +{"current_steps": 110135, "total_steps": 119360, "loss": 0.2525, "lr": 1.8089549032251797e-07, "epoch": 18.454256032171582, "percentage": 92.27, "elapsed_time": "4:21:00", "remaining_time": "0:21:51", "throughput": 4076.89, "total_tokens": 63845392} +{"current_steps": 110140, "total_steps": 119360, "loss": 0.3775, "lr": 1.8070066135030706e-07, "epoch": 18.45509383378016, "percentage": 92.28, "elapsed_time": "4:21:00", "remaining_time": "0:21:51", "throughput": 4076.9, "total_tokens": 63848176} +{"current_steps": 110145, "total_steps": 119360, "loss": 0.5041, "lr": 1.8050593542169537e-07, "epoch": 18.45593163538874, "percentage": 92.28, "elapsed_time": "4:21:01", "remaining_time": "0:21:50", "throughput": 4076.91, "total_tokens": 63850832} +{"current_steps": 110150, "total_steps": 119360, "loss": 0.3335, "lr": 1.803113125408451e-07, "epoch": 18.45676943699732, "percentage": 92.28, "elapsed_time": "4:21:02", "remaining_time": "0:21:49", "throughput": 4076.92, "total_tokens": 63853744} +{"current_steps": 110155, "total_steps": 119360, "loss": 0.4236, "lr": 1.8011679271191794e-07, "epoch": 18.4576072386059, "percentage": 92.29, "elapsed_time": "4:21:02", "remaining_time": "0:21:48", "throughput": 4076.92, "total_tokens": 63856528} +{"current_steps": 110160, "total_steps": 119360, "loss": 0.2816, "lr": 1.7992237593907335e-07, "epoch": 18.458445040214478, "percentage": 92.29, "elapsed_time": "4:21:03", "remaining_time": "0:21:48", "throughput": 4076.93, "total_tokens": 63859408} +{"current_steps": 110165, "total_steps": 119360, "loss": 0.2717, "lr": 1.7972806222646855e-07, "epoch": 18.459282841823057, "percentage": 92.3, "elapsed_time": "4:21:04", "remaining_time": "0:21:47", "throughput": 4076.95, "total_tokens": 63862448} +{"current_steps": 110170, "total_steps": 119360, "loss": 0.2682, "lr": 1.7953385157825686e-07, "epoch": 18.460120643431637, "percentage": 92.3, "elapsed_time": "4:21:04", "remaining_time": "0:21:46", "throughput": 4076.96, "total_tokens": 63865328} +{"current_steps": 110175, "total_steps": 119360, "loss": 0.2234, "lr": 1.7933974399859277e-07, "epoch": 18.460958445040216, "percentage": 92.3, "elapsed_time": "4:21:05", "remaining_time": "0:21:45", "throughput": 4076.96, "total_tokens": 63867984} +{"current_steps": 110180, "total_steps": 119360, "loss": 0.69, "lr": 1.791457394916246e-07, "epoch": 18.461796246648795, "percentage": 92.31, "elapsed_time": "4:21:06", "remaining_time": "0:21:45", "throughput": 4076.97, "total_tokens": 63870736} +{"current_steps": 110185, "total_steps": 119360, "loss": 0.3354, "lr": 1.7895183806150184e-07, "epoch": 18.46263404825737, "percentage": 92.31, "elapsed_time": "4:21:06", "remaining_time": "0:21:44", "throughput": 4076.97, "total_tokens": 63873680} +{"current_steps": 110190, "total_steps": 119360, "loss": 0.5806, "lr": 1.7875803971236948e-07, "epoch": 18.46347184986595, "percentage": 92.32, "elapsed_time": "4:21:07", "remaining_time": "0:21:43", "throughput": 4076.98, "total_tokens": 63876368} +{"current_steps": 110195, "total_steps": 119360, "loss": 0.3168, "lr": 1.7856434444837145e-07, "epoch": 18.46430965147453, "percentage": 92.32, "elapsed_time": "4:21:08", "remaining_time": "0:21:43", "throughput": 4076.99, "total_tokens": 63879376} +{"current_steps": 110200, "total_steps": 119360, "loss": 0.5496, "lr": 1.7837075227364943e-07, "epoch": 18.46514745308311, "percentage": 92.33, "elapsed_time": "4:21:08", "remaining_time": "0:21:42", "throughput": 4076.99, "total_tokens": 63882128} +{"current_steps": 110205, "total_steps": 119360, "loss": 0.2219, "lr": 1.7817726319234286e-07, "epoch": 18.465985254691688, "percentage": 92.33, "elapsed_time": "4:21:09", "remaining_time": "0:21:41", "throughput": 4077.01, "total_tokens": 63885488} +{"current_steps": 110210, "total_steps": 119360, "loss": 0.5089, "lr": 1.77983877208589e-07, "epoch": 18.466823056300267, "percentage": 92.33, "elapsed_time": "4:21:10", "remaining_time": "0:21:41", "throughput": 4077.03, "total_tokens": 63888368} +{"current_steps": 110215, "total_steps": 119360, "loss": 0.3919, "lr": 1.777905943265218e-07, "epoch": 18.467660857908847, "percentage": 92.34, "elapsed_time": "4:21:11", "remaining_time": "0:21:40", "throughput": 4077.04, "total_tokens": 63891280} +{"current_steps": 110220, "total_steps": 119360, "loss": 0.2751, "lr": 1.7759741455027513e-07, "epoch": 18.468498659517426, "percentage": 92.34, "elapsed_time": "4:21:11", "remaining_time": "0:21:39", "throughput": 4077.05, "total_tokens": 63894064} +{"current_steps": 110225, "total_steps": 119360, "loss": 0.3563, "lr": 1.7740433788397793e-07, "epoch": 18.469336461126005, "percentage": 92.35, "elapsed_time": "4:21:12", "remaining_time": "0:21:38", "throughput": 4077.06, "total_tokens": 63896944} +{"current_steps": 110230, "total_steps": 119360, "loss": 0.2545, "lr": 1.7721136433175912e-07, "epoch": 18.470174262734584, "percentage": 92.35, "elapsed_time": "4:21:12", "remaining_time": "0:21:38", "throughput": 4077.06, "total_tokens": 63899696} +{"current_steps": 110235, "total_steps": 119360, "loss": 0.2655, "lr": 1.7701849389774594e-07, "epoch": 18.471012064343164, "percentage": 92.36, "elapsed_time": "4:21:13", "remaining_time": "0:21:37", "throughput": 4077.07, "total_tokens": 63902448} +{"current_steps": 110240, "total_steps": 119360, "loss": 0.4067, "lr": 1.7682572658606068e-07, "epoch": 18.471849865951743, "percentage": 92.36, "elapsed_time": "4:21:14", "remaining_time": "0:21:36", "throughput": 4077.08, "total_tokens": 63905360} +{"current_steps": 110245, "total_steps": 119360, "loss": 0.5124, "lr": 1.7663306240082555e-07, "epoch": 18.472687667560322, "percentage": 92.36, "elapsed_time": "4:21:14", "remaining_time": "0:21:35", "throughput": 4077.09, "total_tokens": 63908112} +{"current_steps": 110250, "total_steps": 119360, "loss": 0.2134, "lr": 1.7644050134616008e-07, "epoch": 18.4735254691689, "percentage": 92.37, "elapsed_time": "4:21:15", "remaining_time": "0:21:35", "throughput": 4077.1, "total_tokens": 63911056} +{"current_steps": 110255, "total_steps": 119360, "loss": 0.356, "lr": 1.762480434261815e-07, "epoch": 18.47436327077748, "percentage": 92.37, "elapsed_time": "4:21:16", "remaining_time": "0:21:34", "throughput": 4077.11, "total_tokens": 63914000} +{"current_steps": 110260, "total_steps": 119360, "loss": 0.4255, "lr": 1.7605568864500487e-07, "epoch": 18.47520107238606, "percentage": 92.38, "elapsed_time": "4:21:16", "remaining_time": "0:21:33", "throughput": 4077.13, "total_tokens": 63917104} +{"current_steps": 110265, "total_steps": 119360, "loss": 0.2803, "lr": 1.7586343700674248e-07, "epoch": 18.47603887399464, "percentage": 92.38, "elapsed_time": "4:21:17", "remaining_time": "0:21:33", "throughput": 4077.14, "total_tokens": 63920272} +{"current_steps": 110270, "total_steps": 119360, "loss": 0.229, "lr": 1.7567128851550541e-07, "epoch": 18.47687667560322, "percentage": 92.38, "elapsed_time": "4:21:18", "remaining_time": "0:21:32", "throughput": 4077.15, "total_tokens": 63923024} +{"current_steps": 110275, "total_steps": 119360, "loss": 0.3271, "lr": 1.7547924317540211e-07, "epoch": 18.477714477211798, "percentage": 92.39, "elapsed_time": "4:21:19", "remaining_time": "0:21:31", "throughput": 4077.16, "total_tokens": 63925776} +{"current_steps": 110280, "total_steps": 119360, "loss": 0.319, "lr": 1.7528730099053926e-07, "epoch": 18.478552278820374, "percentage": 92.39, "elapsed_time": "4:21:19", "remaining_time": "0:21:31", "throughput": 4077.17, "total_tokens": 63928880} +{"current_steps": 110285, "total_steps": 119360, "loss": 0.3224, "lr": 1.7509546196501969e-07, "epoch": 18.479390080428953, "percentage": 92.4, "elapsed_time": "4:21:20", "remaining_time": "0:21:30", "throughput": 4077.18, "total_tokens": 63931728} +{"current_steps": 110290, "total_steps": 119360, "loss": 0.2291, "lr": 1.749037261029457e-07, "epoch": 18.480227882037532, "percentage": 92.4, "elapsed_time": "4:21:21", "remaining_time": "0:21:29", "throughput": 4077.19, "total_tokens": 63934672} +{"current_steps": 110295, "total_steps": 119360, "loss": 0.2917, "lr": 1.7471209340841788e-07, "epoch": 18.48106568364611, "percentage": 92.41, "elapsed_time": "4:21:21", "remaining_time": "0:21:28", "throughput": 4077.2, "total_tokens": 63937552} +{"current_steps": 110300, "total_steps": 119360, "loss": 0.3444, "lr": 1.7452056388553185e-07, "epoch": 18.48190348525469, "percentage": 92.41, "elapsed_time": "4:21:22", "remaining_time": "0:21:28", "throughput": 4077.2, "total_tokens": 63940176} +{"current_steps": 110305, "total_steps": 119360, "loss": 0.4063, "lr": 1.7432913753838377e-07, "epoch": 18.48274128686327, "percentage": 92.41, "elapsed_time": "4:21:23", "remaining_time": "0:21:27", "throughput": 4077.21, "total_tokens": 63942960} +{"current_steps": 110310, "total_steps": 119360, "loss": 0.3767, "lr": 1.7413781437106704e-07, "epoch": 18.48357908847185, "percentage": 92.42, "elapsed_time": "4:21:23", "remaining_time": "0:21:26", "throughput": 4077.23, "total_tokens": 63946000} +{"current_steps": 110315, "total_steps": 119360, "loss": 0.6259, "lr": 1.7394659438767115e-07, "epoch": 18.48441689008043, "percentage": 92.42, "elapsed_time": "4:21:24", "remaining_time": "0:21:26", "throughput": 4077.24, "total_tokens": 63949072} +{"current_steps": 110320, "total_steps": 119360, "loss": 0.3059, "lr": 1.737554775922856e-07, "epoch": 18.485254691689008, "percentage": 92.43, "elapsed_time": "4:21:25", "remaining_time": "0:21:25", "throughput": 4077.24, "total_tokens": 63951760} +{"current_steps": 110325, "total_steps": 119360, "loss": 0.2593, "lr": 1.7356446398899717e-07, "epoch": 18.486092493297587, "percentage": 92.43, "elapsed_time": "4:21:25", "remaining_time": "0:21:24", "throughput": 4077.25, "total_tokens": 63954800} +{"current_steps": 110330, "total_steps": 119360, "loss": 0.2611, "lr": 1.7337355358188924e-07, "epoch": 18.486930294906166, "percentage": 92.43, "elapsed_time": "4:21:26", "remaining_time": "0:21:23", "throughput": 4077.27, "total_tokens": 63957776} +{"current_steps": 110335, "total_steps": 119360, "loss": 0.5107, "lr": 1.7318274637504295e-07, "epoch": 18.487768096514746, "percentage": 92.44, "elapsed_time": "4:21:27", "remaining_time": "0:21:23", "throughput": 4077.27, "total_tokens": 63960528} +{"current_steps": 110340, "total_steps": 119360, "loss": 0.3195, "lr": 1.7299204237254008e-07, "epoch": 18.488605898123325, "percentage": 92.44, "elapsed_time": "4:21:27", "remaining_time": "0:21:22", "throughput": 4077.28, "total_tokens": 63963696} +{"current_steps": 110345, "total_steps": 119360, "loss": 0.1135, "lr": 1.728014415784568e-07, "epoch": 18.489443699731904, "percentage": 92.45, "elapsed_time": "4:21:28", "remaining_time": "0:21:21", "throughput": 4077.29, "total_tokens": 63966768} +{"current_steps": 110350, "total_steps": 119360, "loss": 0.4536, "lr": 1.7261094399686817e-07, "epoch": 18.490281501340483, "percentage": 92.45, "elapsed_time": "4:21:29", "remaining_time": "0:21:21", "throughput": 4077.3, "total_tokens": 63969584} +{"current_steps": 110355, "total_steps": 119360, "loss": 0.3949, "lr": 1.7242054963184818e-07, "epoch": 18.491119302949063, "percentage": 92.46, "elapsed_time": "4:21:29", "remaining_time": "0:21:20", "throughput": 4077.31, "total_tokens": 63972592} +{"current_steps": 110360, "total_steps": 119360, "loss": 0.4006, "lr": 1.7223025848746745e-07, "epoch": 18.491957104557642, "percentage": 92.46, "elapsed_time": "4:21:30", "remaining_time": "0:21:19", "throughput": 4077.32, "total_tokens": 63975504} +{"current_steps": 110365, "total_steps": 119360, "loss": 0.4218, "lr": 1.7204007056779436e-07, "epoch": 18.49279490616622, "percentage": 92.46, "elapsed_time": "4:21:31", "remaining_time": "0:21:18", "throughput": 4077.33, "total_tokens": 63978416} +{"current_steps": 110370, "total_steps": 119360, "loss": 0.2735, "lr": 1.7184998587689572e-07, "epoch": 18.4936327077748, "percentage": 92.47, "elapsed_time": "4:21:31", "remaining_time": "0:21:18", "throughput": 4077.34, "total_tokens": 63981136} +{"current_steps": 110375, "total_steps": 119360, "loss": 0.3176, "lr": 1.71660004418836e-07, "epoch": 18.49447050938338, "percentage": 92.47, "elapsed_time": "4:21:32", "remaining_time": "0:21:17", "throughput": 4077.34, "total_tokens": 63984048} +{"current_steps": 110380, "total_steps": 119360, "loss": 0.2468, "lr": 1.7147012619767644e-07, "epoch": 18.495308310991955, "percentage": 92.48, "elapsed_time": "4:21:33", "remaining_time": "0:21:16", "throughput": 4077.36, "total_tokens": 63987376} +{"current_steps": 110385, "total_steps": 119360, "loss": 0.261, "lr": 1.7128035121747876e-07, "epoch": 18.496146112600535, "percentage": 92.48, "elapsed_time": "4:21:34", "remaining_time": "0:21:16", "throughput": 4077.37, "total_tokens": 63990224} +{"current_steps": 110390, "total_steps": 119360, "loss": 0.2884, "lr": 1.7109067948229863e-07, "epoch": 18.496983914209114, "percentage": 92.48, "elapsed_time": "4:21:34", "remaining_time": "0:21:15", "throughput": 4077.37, "total_tokens": 63992880} +{"current_steps": 110395, "total_steps": 119360, "loss": 0.5054, "lr": 1.709011109961911e-07, "epoch": 18.497821715817693, "percentage": 92.49, "elapsed_time": "4:21:35", "remaining_time": "0:21:14", "throughput": 4077.38, "total_tokens": 63995664} +{"current_steps": 110400, "total_steps": 119360, "loss": 0.1465, "lr": 1.7071164576321243e-07, "epoch": 18.498659517426272, "percentage": 92.49, "elapsed_time": "4:21:35", "remaining_time": "0:21:13", "throughput": 4077.38, "total_tokens": 63998448} +{"current_steps": 110405, "total_steps": 119360, "loss": 0.3268, "lr": 1.7052228378741098e-07, "epoch": 18.49949731903485, "percentage": 92.5, "elapsed_time": "4:21:36", "remaining_time": "0:21:13", "throughput": 4077.4, "total_tokens": 64001456} +{"current_steps": 110410, "total_steps": 119360, "loss": 0.1318, "lr": 1.7033302507283634e-07, "epoch": 18.50033512064343, "percentage": 92.5, "elapsed_time": "4:21:37", "remaining_time": "0:21:12", "throughput": 4077.41, "total_tokens": 64004208} +{"current_steps": 110415, "total_steps": 119360, "loss": 0.2767, "lr": 1.7014386962353525e-07, "epoch": 18.50117292225201, "percentage": 92.51, "elapsed_time": "4:21:37", "remaining_time": "0:21:11", "throughput": 4077.41, "total_tokens": 64006896} +{"current_steps": 110420, "total_steps": 119360, "loss": 0.2592, "lr": 1.699548174435517e-07, "epoch": 18.50201072386059, "percentage": 92.51, "elapsed_time": "4:21:38", "remaining_time": "0:21:11", "throughput": 4077.43, "total_tokens": 64010000} +{"current_steps": 110425, "total_steps": 119360, "loss": 0.1853, "lr": 1.6976586853692856e-07, "epoch": 18.50284852546917, "percentage": 92.51, "elapsed_time": "4:21:39", "remaining_time": "0:21:10", "throughput": 4077.45, "total_tokens": 64013104} +{"current_steps": 110430, "total_steps": 119360, "loss": 0.3715, "lr": 1.695770229077065e-07, "epoch": 18.503686327077748, "percentage": 92.52, "elapsed_time": "4:21:39", "remaining_time": "0:21:09", "throughput": 4077.45, "total_tokens": 64015824} +{"current_steps": 110435, "total_steps": 119360, "loss": 0.3831, "lr": 1.6938828055992064e-07, "epoch": 18.504524128686327, "percentage": 92.52, "elapsed_time": "4:21:40", "remaining_time": "0:21:08", "throughput": 4077.45, "total_tokens": 64018608} +{"current_steps": 110440, "total_steps": 119360, "loss": 0.6791, "lr": 1.6919964149760936e-07, "epoch": 18.505361930294907, "percentage": 92.53, "elapsed_time": "4:21:41", "remaining_time": "0:21:08", "throughput": 4077.46, "total_tokens": 64021360} +{"current_steps": 110445, "total_steps": 119360, "loss": 0.1781, "lr": 1.6901110572480505e-07, "epoch": 18.506199731903486, "percentage": 92.53, "elapsed_time": "4:21:41", "remaining_time": "0:21:07", "throughput": 4077.47, "total_tokens": 64024272} +{"current_steps": 110450, "total_steps": 119360, "loss": 0.425, "lr": 1.6882267324553837e-07, "epoch": 18.507037533512065, "percentage": 92.54, "elapsed_time": "4:21:42", "remaining_time": "0:21:06", "throughput": 4077.47, "total_tokens": 64027024} +{"current_steps": 110455, "total_steps": 119360, "loss": 0.3977, "lr": 1.6863434406383828e-07, "epoch": 18.507875335120644, "percentage": 92.54, "elapsed_time": "4:21:43", "remaining_time": "0:21:06", "throughput": 4077.48, "total_tokens": 64029808} +{"current_steps": 110460, "total_steps": 119360, "loss": 0.3771, "lr": 1.684461181837327e-07, "epoch": 18.508713136729224, "percentage": 92.54, "elapsed_time": "4:21:43", "remaining_time": "0:21:05", "throughput": 4077.48, "total_tokens": 64032752} +{"current_steps": 110465, "total_steps": 119360, "loss": 0.3176, "lr": 1.6825799560924505e-07, "epoch": 18.509550938337803, "percentage": 92.55, "elapsed_time": "4:21:44", "remaining_time": "0:21:04", "throughput": 4077.49, "total_tokens": 64035504} +{"current_steps": 110470, "total_steps": 119360, "loss": 0.3191, "lr": 1.6806997634439826e-07, "epoch": 18.510388739946382, "percentage": 92.55, "elapsed_time": "4:21:45", "remaining_time": "0:21:03", "throughput": 4077.5, "total_tokens": 64038704} +{"current_steps": 110475, "total_steps": 119360, "loss": 0.4953, "lr": 1.6788206039321186e-07, "epoch": 18.51122654155496, "percentage": 92.56, "elapsed_time": "4:21:46", "remaining_time": "0:21:03", "throughput": 4077.51, "total_tokens": 64041456} +{"current_steps": 110480, "total_steps": 119360, "loss": 0.4266, "lr": 1.6769424775970434e-07, "epoch": 18.512064343163537, "percentage": 92.56, "elapsed_time": "4:21:46", "remaining_time": "0:21:02", "throughput": 4077.52, "total_tokens": 64044400} +{"current_steps": 110485, "total_steps": 119360, "loss": 0.4195, "lr": 1.6750653844789078e-07, "epoch": 18.512902144772116, "percentage": 92.56, "elapsed_time": "4:21:47", "remaining_time": "0:21:01", "throughput": 4077.53, "total_tokens": 64047440} +{"current_steps": 110490, "total_steps": 119360, "loss": 0.5685, "lr": 1.6731893246178633e-07, "epoch": 18.513739946380696, "percentage": 92.57, "elapsed_time": "4:21:48", "remaining_time": "0:21:01", "throughput": 4077.54, "total_tokens": 64050288} +{"current_steps": 110495, "total_steps": 119360, "loss": 0.8055, "lr": 1.6713142980539944e-07, "epoch": 18.514577747989275, "percentage": 92.57, "elapsed_time": "4:21:48", "remaining_time": "0:21:00", "throughput": 4077.54, "total_tokens": 64053040} +{"current_steps": 110500, "total_steps": 119360, "loss": 0.3505, "lr": 1.6694403048274133e-07, "epoch": 18.515415549597854, "percentage": 92.58, "elapsed_time": "4:21:49", "remaining_time": "0:20:59", "throughput": 4077.56, "total_tokens": 64056048} +{"current_steps": 110505, "total_steps": 119360, "loss": 0.4657, "lr": 1.6675673449781937e-07, "epoch": 18.516253351206434, "percentage": 92.58, "elapsed_time": "4:21:50", "remaining_time": "0:20:58", "throughput": 4077.56, "total_tokens": 64058864} +{"current_steps": 110510, "total_steps": 119360, "loss": 0.4818, "lr": 1.665695418546359e-07, "epoch": 18.517091152815013, "percentage": 92.59, "elapsed_time": "4:21:50", "remaining_time": "0:20:58", "throughput": 4077.58, "total_tokens": 64061840} +{"current_steps": 110515, "total_steps": 119360, "loss": 0.1575, "lr": 1.66382452557195e-07, "epoch": 18.517928954423592, "percentage": 92.59, "elapsed_time": "4:21:51", "remaining_time": "0:20:57", "throughput": 4077.58, "total_tokens": 64064624} +{"current_steps": 110520, "total_steps": 119360, "loss": 0.4222, "lr": 1.661954666094967e-07, "epoch": 18.51876675603217, "percentage": 92.59, "elapsed_time": "4:21:52", "remaining_time": "0:20:56", "throughput": 4077.58, "total_tokens": 64067152} +{"current_steps": 110525, "total_steps": 119360, "loss": 0.3304, "lr": 1.66008584015539e-07, "epoch": 18.51960455764075, "percentage": 92.6, "elapsed_time": "4:21:52", "remaining_time": "0:20:56", "throughput": 4077.59, "total_tokens": 64070128} +{"current_steps": 110530, "total_steps": 119360, "loss": 0.2045, "lr": 1.6582180477931697e-07, "epoch": 18.52044235924933, "percentage": 92.6, "elapsed_time": "4:21:53", "remaining_time": "0:20:55", "throughput": 4077.6, "total_tokens": 64072912} +{"current_steps": 110535, "total_steps": 119360, "loss": 0.4103, "lr": 1.656351289048258e-07, "epoch": 18.52128016085791, "percentage": 92.61, "elapsed_time": "4:21:54", "remaining_time": "0:20:54", "throughput": 4077.62, "total_tokens": 64076176} +{"current_steps": 110540, "total_steps": 119360, "loss": 0.395, "lr": 1.6544855639605505e-07, "epoch": 18.52211796246649, "percentage": 92.61, "elapsed_time": "4:21:54", "remaining_time": "0:20:53", "throughput": 4077.63, "total_tokens": 64078832} +{"current_steps": 110545, "total_steps": 119360, "loss": 0.2276, "lr": 1.652620872569949e-07, "epoch": 18.522955764075068, "percentage": 92.61, "elapsed_time": "4:21:55", "remaining_time": "0:20:53", "throughput": 4077.63, "total_tokens": 64081616} +{"current_steps": 110550, "total_steps": 119360, "loss": 0.2366, "lr": 1.650757214916332e-07, "epoch": 18.523793565683647, "percentage": 92.62, "elapsed_time": "4:21:56", "remaining_time": "0:20:52", "throughput": 4077.65, "total_tokens": 64084848} +{"current_steps": 110555, "total_steps": 119360, "loss": 0.2486, "lr": 1.6488945910395292e-07, "epoch": 18.524631367292226, "percentage": 92.62, "elapsed_time": "4:21:56", "remaining_time": "0:20:51", "throughput": 4077.66, "total_tokens": 64087824} +{"current_steps": 110560, "total_steps": 119360, "loss": 0.3501, "lr": 1.64703300097937e-07, "epoch": 18.525469168900806, "percentage": 92.63, "elapsed_time": "4:21:57", "remaining_time": "0:20:51", "throughput": 4077.67, "total_tokens": 64090736} +{"current_steps": 110565, "total_steps": 119360, "loss": 0.466, "lr": 1.6451724447756724e-07, "epoch": 18.526306970509385, "percentage": 92.63, "elapsed_time": "4:21:58", "remaining_time": "0:20:50", "throughput": 4077.68, "total_tokens": 64093808} +{"current_steps": 110570, "total_steps": 119360, "loss": 0.6048, "lr": 1.6433129224682042e-07, "epoch": 18.527144772117964, "percentage": 92.64, "elapsed_time": "4:21:58", "remaining_time": "0:20:49", "throughput": 4077.7, "total_tokens": 64097072} +{"current_steps": 110575, "total_steps": 119360, "loss": 0.5503, "lr": 1.6414544340967287e-07, "epoch": 18.52798257372654, "percentage": 92.64, "elapsed_time": "4:21:59", "remaining_time": "0:20:48", "throughput": 4077.7, "total_tokens": 64099824} +{"current_steps": 110580, "total_steps": 119360, "loss": 0.5379, "lr": 1.6395969797009803e-07, "epoch": 18.52882037533512, "percentage": 92.64, "elapsed_time": "4:22:00", "remaining_time": "0:20:48", "throughput": 4077.72, "total_tokens": 64102768} +{"current_steps": 110585, "total_steps": 119360, "loss": 0.2023, "lr": 1.6377405593206773e-07, "epoch": 18.5296581769437, "percentage": 92.65, "elapsed_time": "4:22:00", "remaining_time": "0:20:47", "throughput": 4077.73, "total_tokens": 64105616} +{"current_steps": 110590, "total_steps": 119360, "loss": 0.286, "lr": 1.6358851729955105e-07, "epoch": 18.530495978552278, "percentage": 92.65, "elapsed_time": "4:22:01", "remaining_time": "0:20:46", "throughput": 4077.73, "total_tokens": 64108496} +{"current_steps": 110595, "total_steps": 119360, "loss": 0.2156, "lr": 1.634030820765159e-07, "epoch": 18.531333780160857, "percentage": 92.66, "elapsed_time": "4:22:02", "remaining_time": "0:20:46", "throughput": 4077.74, "total_tokens": 64111280} +{"current_steps": 110600, "total_steps": 119360, "loss": 0.211, "lr": 1.6321775026692578e-07, "epoch": 18.532171581769436, "percentage": 92.66, "elapsed_time": "4:22:02", "remaining_time": "0:20:45", "throughput": 4077.75, "total_tokens": 64114096} +{"current_steps": 110605, "total_steps": 119360, "loss": 0.3347, "lr": 1.6303252187474417e-07, "epoch": 18.533009383378015, "percentage": 92.67, "elapsed_time": "4:22:03", "remaining_time": "0:20:44", "throughput": 4077.75, "total_tokens": 64116656} +{"current_steps": 110610, "total_steps": 119360, "loss": 0.112, "lr": 1.628473969039318e-07, "epoch": 18.533847184986595, "percentage": 92.67, "elapsed_time": "4:22:04", "remaining_time": "0:20:43", "throughput": 4077.76, "total_tokens": 64119632} +{"current_steps": 110615, "total_steps": 119360, "loss": 0.2516, "lr": 1.626623753584461e-07, "epoch": 18.534684986595174, "percentage": 92.67, "elapsed_time": "4:22:04", "remaining_time": "0:20:43", "throughput": 4077.77, "total_tokens": 64122544} +{"current_steps": 110620, "total_steps": 119360, "loss": 0.264, "lr": 1.6247745724224274e-07, "epoch": 18.535522788203753, "percentage": 92.68, "elapsed_time": "4:22:05", "remaining_time": "0:20:42", "throughput": 4077.78, "total_tokens": 64125168} +{"current_steps": 110625, "total_steps": 119360, "loss": 0.6985, "lr": 1.6229264255927747e-07, "epoch": 18.536360589812332, "percentage": 92.68, "elapsed_time": "4:22:06", "remaining_time": "0:20:41", "throughput": 4077.78, "total_tokens": 64127888} +{"current_steps": 110630, "total_steps": 119360, "loss": 0.2978, "lr": 1.6210793131350045e-07, "epoch": 18.53719839142091, "percentage": 92.69, "elapsed_time": "4:22:06", "remaining_time": "0:20:41", "throughput": 4077.79, "total_tokens": 64130864} +{"current_steps": 110635, "total_steps": 119360, "loss": 0.5368, "lr": 1.6192332350886075e-07, "epoch": 18.53803619302949, "percentage": 92.69, "elapsed_time": "4:22:07", "remaining_time": "0:20:40", "throughput": 4077.8, "total_tokens": 64133872} +{"current_steps": 110640, "total_steps": 119360, "loss": 0.2394, "lr": 1.617388191493069e-07, "epoch": 18.53887399463807, "percentage": 92.69, "elapsed_time": "4:22:08", "remaining_time": "0:20:39", "throughput": 4077.82, "total_tokens": 64137008} +{"current_steps": 110645, "total_steps": 119360, "loss": 0.1976, "lr": 1.6155441823878237e-07, "epoch": 18.53971179624665, "percentage": 92.7, "elapsed_time": "4:22:08", "remaining_time": "0:20:38", "throughput": 4077.82, "total_tokens": 64139728} +{"current_steps": 110650, "total_steps": 119360, "loss": 0.2682, "lr": 1.6137012078123125e-07, "epoch": 18.54054959785523, "percentage": 92.7, "elapsed_time": "4:22:09", "remaining_time": "0:20:38", "throughput": 4077.83, "total_tokens": 64142704} +{"current_steps": 110655, "total_steps": 119360, "loss": 0.3399, "lr": 1.6118592678059374e-07, "epoch": 18.541387399463808, "percentage": 92.71, "elapsed_time": "4:22:10", "remaining_time": "0:20:37", "throughput": 4077.84, "total_tokens": 64145616} +{"current_steps": 110660, "total_steps": 119360, "loss": 0.4109, "lr": 1.6100183624080666e-07, "epoch": 18.542225201072387, "percentage": 92.71, "elapsed_time": "4:22:10", "remaining_time": "0:20:36", "throughput": 4077.85, "total_tokens": 64148592} +{"current_steps": 110665, "total_steps": 119360, "loss": 0.3443, "lr": 1.6081784916580856e-07, "epoch": 18.543063002680967, "percentage": 92.72, "elapsed_time": "4:22:11", "remaining_time": "0:20:36", "throughput": 4077.87, "total_tokens": 64151824} +{"current_steps": 110670, "total_steps": 119360, "loss": 0.6665, "lr": 1.6063396555953238e-07, "epoch": 18.543900804289546, "percentage": 92.72, "elapsed_time": "4:22:12", "remaining_time": "0:20:35", "throughput": 4077.88, "total_tokens": 64154832} +{"current_steps": 110675, "total_steps": 119360, "loss": 0.2895, "lr": 1.6045018542590883e-07, "epoch": 18.54473860589812, "percentage": 92.72, "elapsed_time": "4:22:13", "remaining_time": "0:20:34", "throughput": 4077.89, "total_tokens": 64157776} +{"current_steps": 110680, "total_steps": 119360, "loss": 0.3516, "lr": 1.6026650876886817e-07, "epoch": 18.5455764075067, "percentage": 92.73, "elapsed_time": "4:22:13", "remaining_time": "0:20:33", "throughput": 4077.91, "total_tokens": 64161104} +{"current_steps": 110685, "total_steps": 119360, "loss": 0.2529, "lr": 1.6008293559233834e-07, "epoch": 18.54641420911528, "percentage": 92.73, "elapsed_time": "4:22:14", "remaining_time": "0:20:33", "throughput": 4077.92, "total_tokens": 64164208} +{"current_steps": 110690, "total_steps": 119360, "loss": 0.3086, "lr": 1.598994659002434e-07, "epoch": 18.54725201072386, "percentage": 92.74, "elapsed_time": "4:22:15", "remaining_time": "0:20:32", "throughput": 4077.93, "total_tokens": 64166896} +{"current_steps": 110695, "total_steps": 119360, "loss": 0.5598, "lr": 1.5971609969650637e-07, "epoch": 18.54808981233244, "percentage": 92.74, "elapsed_time": "4:22:15", "remaining_time": "0:20:31", "throughput": 4077.94, "total_tokens": 64169776} +{"current_steps": 110700, "total_steps": 119360, "loss": 0.206, "lr": 1.595328369850485e-07, "epoch": 18.548927613941018, "percentage": 92.74, "elapsed_time": "4:22:16", "remaining_time": "0:20:31", "throughput": 4077.94, "total_tokens": 64172528} +{"current_steps": 110705, "total_steps": 119360, "loss": 0.3144, "lr": 1.5934967776978728e-07, "epoch": 18.549765415549597, "percentage": 92.75, "elapsed_time": "4:22:17", "remaining_time": "0:20:30", "throughput": 4077.95, "total_tokens": 64175376} +{"current_steps": 110710, "total_steps": 119360, "loss": 0.255, "lr": 1.5916662205463952e-07, "epoch": 18.550603217158177, "percentage": 92.75, "elapsed_time": "4:22:17", "remaining_time": "0:20:29", "throughput": 4077.96, "total_tokens": 64178192} +{"current_steps": 110715, "total_steps": 119360, "loss": 0.4807, "lr": 1.5898366984351988e-07, "epoch": 18.551441018766756, "percentage": 92.76, "elapsed_time": "4:22:18", "remaining_time": "0:20:28", "throughput": 4077.97, "total_tokens": 64181168} +{"current_steps": 110720, "total_steps": 119360, "loss": 0.4118, "lr": 1.5880082114033857e-07, "epoch": 18.552278820375335, "percentage": 92.76, "elapsed_time": "4:22:19", "remaining_time": "0:20:28", "throughput": 4077.97, "total_tokens": 64183856} +{"current_steps": 110725, "total_steps": 119360, "loss": 0.4747, "lr": 1.586180759490058e-07, "epoch": 18.553116621983914, "percentage": 92.77, "elapsed_time": "4:22:19", "remaining_time": "0:20:27", "throughput": 4077.98, "total_tokens": 64186768} +{"current_steps": 110730, "total_steps": 119360, "loss": 0.2891, "lr": 1.5843543427342956e-07, "epoch": 18.553954423592494, "percentage": 92.77, "elapsed_time": "4:22:20", "remaining_time": "0:20:26", "throughput": 4077.99, "total_tokens": 64189616} +{"current_steps": 110735, "total_steps": 119360, "loss": 0.1578, "lr": 1.582528961175145e-07, "epoch": 18.554792225201073, "percentage": 92.77, "elapsed_time": "4:22:21", "remaining_time": "0:20:26", "throughput": 4078.0, "total_tokens": 64192720} +{"current_steps": 110740, "total_steps": 119360, "loss": 0.3157, "lr": 1.5807046148516357e-07, "epoch": 18.555630026809652, "percentage": 92.78, "elapsed_time": "4:22:21", "remaining_time": "0:20:25", "throughput": 4078.01, "total_tokens": 64195472} +{"current_steps": 110745, "total_steps": 119360, "loss": 0.4062, "lr": 1.5788813038027762e-07, "epoch": 18.55646782841823, "percentage": 92.78, "elapsed_time": "4:22:22", "remaining_time": "0:20:24", "throughput": 4078.02, "total_tokens": 64198256} +{"current_steps": 110750, "total_steps": 119360, "loss": 0.3273, "lr": 1.5770590280675458e-07, "epoch": 18.55730563002681, "percentage": 92.79, "elapsed_time": "4:22:23", "remaining_time": "0:20:23", "throughput": 4078.03, "total_tokens": 64201104} +{"current_steps": 110755, "total_steps": 119360, "loss": 0.3531, "lr": 1.5752377876849133e-07, "epoch": 18.55814343163539, "percentage": 92.79, "elapsed_time": "4:22:23", "remaining_time": "0:20:23", "throughput": 4078.03, "total_tokens": 64203888} +{"current_steps": 110760, "total_steps": 119360, "loss": 0.6261, "lr": 1.5734175826938258e-07, "epoch": 18.55898123324397, "percentage": 92.79, "elapsed_time": "4:22:24", "remaining_time": "0:20:22", "throughput": 4078.04, "total_tokens": 64206608} +{"current_steps": 110765, "total_steps": 119360, "loss": 0.5333, "lr": 1.5715984131331796e-07, "epoch": 18.55981903485255, "percentage": 92.8, "elapsed_time": "4:22:25", "remaining_time": "0:20:21", "throughput": 4078.04, "total_tokens": 64209360} +{"current_steps": 110770, "total_steps": 119360, "loss": 0.2767, "lr": 1.5697802790418936e-07, "epoch": 18.560656836461128, "percentage": 92.8, "elapsed_time": "4:22:25", "remaining_time": "0:20:21", "throughput": 4078.05, "total_tokens": 64212272} +{"current_steps": 110775, "total_steps": 119360, "loss": 0.3731, "lr": 1.5679631804588424e-07, "epoch": 18.561494638069703, "percentage": 92.81, "elapsed_time": "4:22:26", "remaining_time": "0:20:20", "throughput": 4078.06, "total_tokens": 64215088} +{"current_steps": 110780, "total_steps": 119360, "loss": 0.3195, "lr": 1.5661471174228614e-07, "epoch": 18.562332439678283, "percentage": 92.81, "elapsed_time": "4:22:27", "remaining_time": "0:20:19", "throughput": 4078.07, "total_tokens": 64217904} +{"current_steps": 110785, "total_steps": 119360, "loss": 0.2953, "lr": 1.5643320899727809e-07, "epoch": 18.563170241286862, "percentage": 92.82, "elapsed_time": "4:22:27", "remaining_time": "0:20:18", "throughput": 4078.07, "total_tokens": 64220816} +{"current_steps": 110790, "total_steps": 119360, "loss": 0.2912, "lr": 1.5625180981474308e-07, "epoch": 18.56400804289544, "percentage": 92.82, "elapsed_time": "4:22:28", "remaining_time": "0:20:18", "throughput": 4078.09, "total_tokens": 64223792} +{"current_steps": 110795, "total_steps": 119360, "loss": 0.3482, "lr": 1.56070514198558e-07, "epoch": 18.56484584450402, "percentage": 92.82, "elapsed_time": "4:22:29", "remaining_time": "0:20:17", "throughput": 4078.09, "total_tokens": 64226512} +{"current_steps": 110800, "total_steps": 119360, "loss": 0.3828, "lr": 1.558893221525992e-07, "epoch": 18.5656836461126, "percentage": 92.83, "elapsed_time": "4:22:29", "remaining_time": "0:20:16", "throughput": 4078.1, "total_tokens": 64229264} +{"current_steps": 110805, "total_steps": 119360, "loss": 0.1783, "lr": 1.557082336807414e-07, "epoch": 18.56652144772118, "percentage": 92.83, "elapsed_time": "4:22:30", "remaining_time": "0:20:16", "throughput": 4078.11, "total_tokens": 64232240} +{"current_steps": 110810, "total_steps": 119360, "loss": 0.3478, "lr": 1.5552724878685643e-07, "epoch": 18.56735924932976, "percentage": 92.84, "elapsed_time": "4:22:31", "remaining_time": "0:20:15", "throughput": 4078.12, "total_tokens": 64235024} +{"current_steps": 110815, "total_steps": 119360, "loss": 0.3378, "lr": 1.55346367474814e-07, "epoch": 18.568197050938338, "percentage": 92.84, "elapsed_time": "4:22:31", "remaining_time": "0:20:14", "throughput": 4078.13, "total_tokens": 64237808} +{"current_steps": 110820, "total_steps": 119360, "loss": 0.2097, "lr": 1.551655897484816e-07, "epoch": 18.569034852546917, "percentage": 92.85, "elapsed_time": "4:22:32", "remaining_time": "0:20:13", "throughput": 4078.14, "total_tokens": 64240912} +{"current_steps": 110825, "total_steps": 119360, "loss": 0.3234, "lr": 1.5498491561172335e-07, "epoch": 18.569872654155496, "percentage": 92.85, "elapsed_time": "4:22:33", "remaining_time": "0:20:13", "throughput": 4078.15, "total_tokens": 64243920} +{"current_steps": 110830, "total_steps": 119360, "loss": 0.145, "lr": 1.5480434506840447e-07, "epoch": 18.570710455764075, "percentage": 92.85, "elapsed_time": "4:22:33", "remaining_time": "0:20:12", "throughput": 4078.17, "total_tokens": 64246800} +{"current_steps": 110835, "total_steps": 119360, "loss": 0.4611, "lr": 1.5462387812238467e-07, "epoch": 18.571548257372655, "percentage": 92.86, "elapsed_time": "4:22:34", "remaining_time": "0:20:11", "throughput": 4078.17, "total_tokens": 64249744} +{"current_steps": 110840, "total_steps": 119360, "loss": 0.56, "lr": 1.544435147775225e-07, "epoch": 18.572386058981234, "percentage": 92.86, "elapsed_time": "4:22:35", "remaining_time": "0:20:11", "throughput": 4078.19, "total_tokens": 64252656} +{"current_steps": 110845, "total_steps": 119360, "loss": 0.2883, "lr": 1.5426325503767437e-07, "epoch": 18.573223860589813, "percentage": 92.87, "elapsed_time": "4:22:35", "remaining_time": "0:20:10", "throughput": 4078.2, "total_tokens": 64255696} +{"current_steps": 110850, "total_steps": 119360, "loss": 0.4835, "lr": 1.5408309890669493e-07, "epoch": 18.574061662198392, "percentage": 92.87, "elapsed_time": "4:22:36", "remaining_time": "0:20:09", "throughput": 4078.2, "total_tokens": 64258384} +{"current_steps": 110855, "total_steps": 119360, "loss": 0.2323, "lr": 1.5390304638843555e-07, "epoch": 18.57489946380697, "percentage": 92.87, "elapsed_time": "4:22:37", "remaining_time": "0:20:08", "throughput": 4078.21, "total_tokens": 64261328} +{"current_steps": 110860, "total_steps": 119360, "loss": 0.3045, "lr": 1.5372309748674652e-07, "epoch": 18.57573726541555, "percentage": 92.88, "elapsed_time": "4:22:37", "remaining_time": "0:20:08", "throughput": 4078.22, "total_tokens": 64264016} +{"current_steps": 110865, "total_steps": 119360, "loss": 0.1723, "lr": 1.5354325220547638e-07, "epoch": 18.57657506702413, "percentage": 92.88, "elapsed_time": "4:22:38", "remaining_time": "0:20:07", "throughput": 4078.22, "total_tokens": 64266704} +{"current_steps": 110870, "total_steps": 119360, "loss": 0.4873, "lr": 1.5336351054846764e-07, "epoch": 18.577412868632706, "percentage": 92.89, "elapsed_time": "4:22:39", "remaining_time": "0:20:06", "throughput": 4078.23, "total_tokens": 64269776} +{"current_steps": 110875, "total_steps": 119360, "loss": 0.5072, "lr": 1.5318387251956558e-07, "epoch": 18.578250670241285, "percentage": 92.89, "elapsed_time": "4:22:39", "remaining_time": "0:20:06", "throughput": 4078.24, "total_tokens": 64272976} +{"current_steps": 110880, "total_steps": 119360, "loss": 0.1645, "lr": 1.5300433812261206e-07, "epoch": 18.579088471849865, "percentage": 92.9, "elapsed_time": "4:22:40", "remaining_time": "0:20:05", "throughput": 4078.26, "total_tokens": 64275920} +{"current_steps": 110885, "total_steps": 119360, "loss": 0.2856, "lr": 1.5282490736144352e-07, "epoch": 18.579926273458444, "percentage": 92.9, "elapsed_time": "4:22:41", "remaining_time": "0:20:04", "throughput": 4078.27, "total_tokens": 64278832} +{"current_steps": 110890, "total_steps": 119360, "loss": 0.3699, "lr": 1.526455802398963e-07, "epoch": 18.580764075067023, "percentage": 92.9, "elapsed_time": "4:22:41", "remaining_time": "0:20:03", "throughput": 4078.27, "total_tokens": 64281552} +{"current_steps": 110895, "total_steps": 119360, "loss": 0.2962, "lr": 1.5246635676180733e-07, "epoch": 18.581601876675602, "percentage": 92.91, "elapsed_time": "4:22:42", "remaining_time": "0:20:03", "throughput": 4078.29, "total_tokens": 64284560} +{"current_steps": 110900, "total_steps": 119360, "loss": 0.5155, "lr": 1.522872369310069e-07, "epoch": 18.58243967828418, "percentage": 92.91, "elapsed_time": "4:22:43", "remaining_time": "0:20:02", "throughput": 4078.29, "total_tokens": 64287504} +{"current_steps": 110905, "total_steps": 119360, "loss": 0.3406, "lr": 1.521082207513247e-07, "epoch": 18.58327747989276, "percentage": 92.92, "elapsed_time": "4:22:44", "remaining_time": "0:20:01", "throughput": 4078.3, "total_tokens": 64290320} +{"current_steps": 110910, "total_steps": 119360, "loss": 0.3596, "lr": 1.5192930822658824e-07, "epoch": 18.58411528150134, "percentage": 92.92, "elapsed_time": "4:22:44", "remaining_time": "0:20:01", "throughput": 4078.3, "total_tokens": 64292848} +{"current_steps": 110915, "total_steps": 119360, "loss": 0.1955, "lr": 1.517504993606239e-07, "epoch": 18.58495308310992, "percentage": 92.92, "elapsed_time": "4:22:45", "remaining_time": "0:20:00", "throughput": 4078.31, "total_tokens": 64295792} +{"current_steps": 110920, "total_steps": 119360, "loss": 0.5802, "lr": 1.515717941572542e-07, "epoch": 18.5857908847185, "percentage": 92.93, "elapsed_time": "4:22:45", "remaining_time": "0:19:59", "throughput": 4078.32, "total_tokens": 64298672} +{"current_steps": 110925, "total_steps": 119360, "loss": 0.6397, "lr": 1.5139319262030107e-07, "epoch": 18.586628686327078, "percentage": 92.93, "elapsed_time": "4:22:46", "remaining_time": "0:19:58", "throughput": 4078.33, "total_tokens": 64301584} +{"current_steps": 110930, "total_steps": 119360, "loss": 0.4563, "lr": 1.512146947535814e-07, "epoch": 18.587466487935657, "percentage": 92.94, "elapsed_time": "4:22:47", "remaining_time": "0:19:58", "throughput": 4078.34, "total_tokens": 64304272} +{"current_steps": 110935, "total_steps": 119360, "loss": 0.3785, "lr": 1.510363005609128e-07, "epoch": 18.588304289544237, "percentage": 92.94, "elapsed_time": "4:22:47", "remaining_time": "0:19:57", "throughput": 4078.35, "total_tokens": 64307248} +{"current_steps": 110940, "total_steps": 119360, "loss": 0.2157, "lr": 1.5085801004611046e-07, "epoch": 18.589142091152816, "percentage": 92.95, "elapsed_time": "4:22:48", "remaining_time": "0:19:56", "throughput": 4078.36, "total_tokens": 64310320} +{"current_steps": 110945, "total_steps": 119360, "loss": 0.3463, "lr": 1.5067982321298523e-07, "epoch": 18.589979892761395, "percentage": 92.95, "elapsed_time": "4:22:49", "remaining_time": "0:19:56", "throughput": 4078.38, "total_tokens": 64313424} +{"current_steps": 110950, "total_steps": 119360, "loss": 0.335, "lr": 1.5050174006534747e-07, "epoch": 18.590817694369974, "percentage": 92.95, "elapsed_time": "4:22:49", "remaining_time": "0:19:55", "throughput": 4078.38, "total_tokens": 64316080} +{"current_steps": 110955, "total_steps": 119360, "loss": 0.52, "lr": 1.503237606070046e-07, "epoch": 18.591655495978554, "percentage": 92.96, "elapsed_time": "4:22:50", "remaining_time": "0:19:54", "throughput": 4078.39, "total_tokens": 64318800} +{"current_steps": 110960, "total_steps": 119360, "loss": 0.3725, "lr": 1.5014588484176253e-07, "epoch": 18.592493297587133, "percentage": 92.96, "elapsed_time": "4:22:51", "remaining_time": "0:19:53", "throughput": 4078.4, "total_tokens": 64321648} +{"current_steps": 110965, "total_steps": 119360, "loss": 0.364, "lr": 1.499681127734237e-07, "epoch": 18.593331099195712, "percentage": 92.97, "elapsed_time": "4:22:51", "remaining_time": "0:19:53", "throughput": 4078.4, "total_tokens": 64324240} +{"current_steps": 110970, "total_steps": 119360, "loss": 0.4426, "lr": 1.4979044440579015e-07, "epoch": 18.594168900804288, "percentage": 92.97, "elapsed_time": "4:22:52", "remaining_time": "0:19:52", "throughput": 4078.42, "total_tokens": 64327408} +{"current_steps": 110975, "total_steps": 119360, "loss": 0.1245, "lr": 1.4961287974265992e-07, "epoch": 18.595006702412867, "percentage": 92.98, "elapsed_time": "4:22:53", "remaining_time": "0:19:51", "throughput": 4078.43, "total_tokens": 64330160} +{"current_steps": 110980, "total_steps": 119360, "loss": 0.2422, "lr": 1.4943541878782997e-07, "epoch": 18.595844504021446, "percentage": 92.98, "elapsed_time": "4:22:53", "remaining_time": "0:19:51", "throughput": 4078.44, "total_tokens": 64333104} +{"current_steps": 110985, "total_steps": 119360, "loss": 0.2695, "lr": 1.4925806154509504e-07, "epoch": 18.596682305630026, "percentage": 92.98, "elapsed_time": "4:22:54", "remaining_time": "0:19:50", "throughput": 4078.45, "total_tokens": 64336400} +{"current_steps": 110990, "total_steps": 119360, "loss": 0.6218, "lr": 1.49080808018246e-07, "epoch": 18.597520107238605, "percentage": 92.99, "elapsed_time": "4:22:55", "remaining_time": "0:19:49", "throughput": 4078.46, "total_tokens": 64339088} +{"current_steps": 110995, "total_steps": 119360, "loss": 0.395, "lr": 1.4890365821107423e-07, "epoch": 18.598357908847184, "percentage": 92.99, "elapsed_time": "4:22:55", "remaining_time": "0:19:48", "throughput": 4078.47, "total_tokens": 64341776} +{"current_steps": 111000, "total_steps": 119360, "loss": 0.5035, "lr": 1.4872661212736729e-07, "epoch": 18.599195710455763, "percentage": 93.0, "elapsed_time": "4:22:56", "remaining_time": "0:19:48", "throughput": 4078.48, "total_tokens": 64344688} +{"current_steps": 111005, "total_steps": 119360, "loss": 0.2721, "lr": 1.4854966977090934e-07, "epoch": 18.600033512064343, "percentage": 93.0, "elapsed_time": "4:22:57", "remaining_time": "0:19:47", "throughput": 4078.49, "total_tokens": 64347568} +{"current_steps": 111010, "total_steps": 119360, "loss": 0.3347, "lr": 1.4837283114548518e-07, "epoch": 18.600871313672922, "percentage": 93.0, "elapsed_time": "4:22:57", "remaining_time": "0:19:46", "throughput": 4078.5, "total_tokens": 64350384} +{"current_steps": 111015, "total_steps": 119360, "loss": 0.6342, "lr": 1.4819609625487453e-07, "epoch": 18.6017091152815, "percentage": 93.01, "elapsed_time": "4:22:58", "remaining_time": "0:19:46", "throughput": 4078.51, "total_tokens": 64353520} +{"current_steps": 111020, "total_steps": 119360, "loss": 0.2222, "lr": 1.480194651028577e-07, "epoch": 18.60254691689008, "percentage": 93.01, "elapsed_time": "4:22:59", "remaining_time": "0:19:45", "throughput": 4078.52, "total_tokens": 64356336} +{"current_steps": 111025, "total_steps": 119360, "loss": 0.2447, "lr": 1.4784293769321e-07, "epoch": 18.60338471849866, "percentage": 93.02, "elapsed_time": "4:23:00", "remaining_time": "0:19:44", "throughput": 4078.53, "total_tokens": 64359344} +{"current_steps": 111030, "total_steps": 119360, "loss": 0.4719, "lr": 1.4766651402970733e-07, "epoch": 18.60422252010724, "percentage": 93.02, "elapsed_time": "4:23:00", "remaining_time": "0:19:43", "throughput": 4078.54, "total_tokens": 64362224} +{"current_steps": 111035, "total_steps": 119360, "loss": 0.4172, "lr": 1.4749019411611998e-07, "epoch": 18.60506032171582, "percentage": 93.03, "elapsed_time": "4:23:01", "remaining_time": "0:19:43", "throughput": 4078.55, "total_tokens": 64365328} +{"current_steps": 111040, "total_steps": 119360, "loss": 0.4332, "lr": 1.4731397795621882e-07, "epoch": 18.605898123324398, "percentage": 93.03, "elapsed_time": "4:23:02", "remaining_time": "0:19:42", "throughput": 4078.56, "total_tokens": 64368208} +{"current_steps": 111045, "total_steps": 119360, "loss": 0.3471, "lr": 1.4713786555377308e-07, "epoch": 18.606735924932977, "percentage": 93.03, "elapsed_time": "4:23:02", "remaining_time": "0:19:41", "throughput": 4078.57, "total_tokens": 64370960} +{"current_steps": 111050, "total_steps": 119360, "loss": 0.407, "lr": 1.4696185691254583e-07, "epoch": 18.607573726541556, "percentage": 93.04, "elapsed_time": "4:23:03", "remaining_time": "0:19:41", "throughput": 4078.58, "total_tokens": 64373712} +{"current_steps": 111055, "total_steps": 119360, "loss": 0.5197, "lr": 1.4678595203630186e-07, "epoch": 18.608411528150135, "percentage": 93.04, "elapsed_time": "4:23:04", "remaining_time": "0:19:40", "throughput": 4078.59, "total_tokens": 64376560} +{"current_steps": 111060, "total_steps": 119360, "loss": 0.6479, "lr": 1.4661015092880149e-07, "epoch": 18.609249329758715, "percentage": 93.05, "elapsed_time": "4:23:04", "remaining_time": "0:19:39", "throughput": 4078.6, "total_tokens": 64379568} +{"current_steps": 111065, "total_steps": 119360, "loss": 0.2684, "lr": 1.4643445359380393e-07, "epoch": 18.610087131367294, "percentage": 93.05, "elapsed_time": "4:23:05", "remaining_time": "0:19:38", "throughput": 4078.61, "total_tokens": 64382480} +{"current_steps": 111070, "total_steps": 119360, "loss": 0.3853, "lr": 1.4625886003506617e-07, "epoch": 18.61092493297587, "percentage": 93.05, "elapsed_time": "4:23:06", "remaining_time": "0:19:38", "throughput": 4078.62, "total_tokens": 64385552} +{"current_steps": 111075, "total_steps": 119360, "loss": 0.2853, "lr": 1.4608337025634244e-07, "epoch": 18.61176273458445, "percentage": 93.06, "elapsed_time": "4:23:06", "remaining_time": "0:19:37", "throughput": 4078.64, "total_tokens": 64388464} +{"current_steps": 111080, "total_steps": 119360, "loss": 0.6029, "lr": 1.459079842613853e-07, "epoch": 18.61260053619303, "percentage": 93.06, "elapsed_time": "4:23:07", "remaining_time": "0:19:36", "throughput": 4078.65, "total_tokens": 64391312} +{"current_steps": 111085, "total_steps": 119360, "loss": 0.1932, "lr": 1.4573270205394396e-07, "epoch": 18.613438337801608, "percentage": 93.07, "elapsed_time": "4:23:08", "remaining_time": "0:19:36", "throughput": 4078.65, "total_tokens": 64394064} +{"current_steps": 111090, "total_steps": 119360, "loss": 0.2297, "lr": 1.455575236377671e-07, "epoch": 18.614276139410187, "percentage": 93.07, "elapsed_time": "4:23:08", "remaining_time": "0:19:35", "throughput": 4078.66, "total_tokens": 64397072} +{"current_steps": 111095, "total_steps": 119360, "loss": 0.3482, "lr": 1.4538244901659892e-07, "epoch": 18.615113941018766, "percentage": 93.08, "elapsed_time": "4:23:09", "remaining_time": "0:19:34", "throughput": 4078.67, "total_tokens": 64399856} +{"current_steps": 111100, "total_steps": 119360, "loss": 0.4971, "lr": 1.452074781941848e-07, "epoch": 18.615951742627345, "percentage": 93.08, "elapsed_time": "4:23:10", "remaining_time": "0:19:33", "throughput": 4078.69, "total_tokens": 64402896} +{"current_steps": 111105, "total_steps": 119360, "loss": 0.2021, "lr": 1.4503261117426392e-07, "epoch": 18.616789544235925, "percentage": 93.08, "elapsed_time": "4:23:10", "remaining_time": "0:19:33", "throughput": 4078.7, "total_tokens": 64405840} +{"current_steps": 111110, "total_steps": 119360, "loss": 0.4799, "lr": 1.4485784796057667e-07, "epoch": 18.617627345844504, "percentage": 93.09, "elapsed_time": "4:23:11", "remaining_time": "0:19:32", "throughput": 4078.7, "total_tokens": 64408464} +{"current_steps": 111115, "total_steps": 119360, "loss": 0.3544, "lr": 1.4468318855685838e-07, "epoch": 18.618465147453083, "percentage": 93.09, "elapsed_time": "4:23:12", "remaining_time": "0:19:31", "throughput": 4078.71, "total_tokens": 64411184} +{"current_steps": 111120, "total_steps": 119360, "loss": 0.2493, "lr": 1.4450863296684436e-07, "epoch": 18.619302949061662, "percentage": 93.1, "elapsed_time": "4:23:12", "remaining_time": "0:19:31", "throughput": 4078.71, "total_tokens": 64413936} +{"current_steps": 111125, "total_steps": 119360, "loss": 0.355, "lr": 1.4433418119426724e-07, "epoch": 18.62014075067024, "percentage": 93.1, "elapsed_time": "4:23:13", "remaining_time": "0:19:30", "throughput": 4078.72, "total_tokens": 64417104} +{"current_steps": 111130, "total_steps": 119360, "loss": 0.1308, "lr": 1.441598332428562e-07, "epoch": 18.62097855227882, "percentage": 93.1, "elapsed_time": "4:23:14", "remaining_time": "0:19:29", "throughput": 4078.74, "total_tokens": 64420240} +{"current_steps": 111135, "total_steps": 119360, "loss": 0.3135, "lr": 1.4398558911633941e-07, "epoch": 18.6218163538874, "percentage": 93.11, "elapsed_time": "4:23:14", "remaining_time": "0:19:28", "throughput": 4078.75, "total_tokens": 64423152} +{"current_steps": 111140, "total_steps": 119360, "loss": 0.501, "lr": 1.4381144881844222e-07, "epoch": 18.62265415549598, "percentage": 93.11, "elapsed_time": "4:23:15", "remaining_time": "0:19:28", "throughput": 4078.75, "total_tokens": 64425904} +{"current_steps": 111145, "total_steps": 119360, "loss": 0.3927, "lr": 1.4363741235288832e-07, "epoch": 18.62349195710456, "percentage": 93.12, "elapsed_time": "4:23:16", "remaining_time": "0:19:27", "throughput": 4078.76, "total_tokens": 64428656} +{"current_steps": 111150, "total_steps": 119360, "loss": 0.1912, "lr": 1.4346347972339913e-07, "epoch": 18.624329758713138, "percentage": 93.12, "elapsed_time": "4:23:16", "remaining_time": "0:19:26", "throughput": 4078.77, "total_tokens": 64431440} +{"current_steps": 111155, "total_steps": 119360, "loss": 0.4628, "lr": 1.4328965093369284e-07, "epoch": 18.625167560321717, "percentage": 93.13, "elapsed_time": "4:23:17", "remaining_time": "0:19:26", "throughput": 4078.77, "total_tokens": 64433936} +{"current_steps": 111160, "total_steps": 119360, "loss": 0.1935, "lr": 1.43115925987487e-07, "epoch": 18.626005361930297, "percentage": 93.13, "elapsed_time": "4:23:18", "remaining_time": "0:19:25", "throughput": 4078.79, "total_tokens": 64437072} +{"current_steps": 111165, "total_steps": 119360, "loss": 0.3136, "lr": 1.4294230488849537e-07, "epoch": 18.626843163538872, "percentage": 93.13, "elapsed_time": "4:23:18", "remaining_time": "0:19:24", "throughput": 4078.79, "total_tokens": 64439888} +{"current_steps": 111170, "total_steps": 119360, "loss": 0.2342, "lr": 1.4276878764043046e-07, "epoch": 18.62768096514745, "percentage": 93.14, "elapsed_time": "4:23:19", "remaining_time": "0:19:23", "throughput": 4078.81, "total_tokens": 64442896} +{"current_steps": 111175, "total_steps": 119360, "loss": 0.2668, "lr": 1.425953742470021e-07, "epoch": 18.62851876675603, "percentage": 93.14, "elapsed_time": "4:23:20", "remaining_time": "0:19:23", "throughput": 4078.82, "total_tokens": 64445680} +{"current_steps": 111180, "total_steps": 119360, "loss": 0.2827, "lr": 1.4242206471191843e-07, "epoch": 18.62935656836461, "percentage": 93.15, "elapsed_time": "4:23:20", "remaining_time": "0:19:22", "throughput": 4078.82, "total_tokens": 64448432} +{"current_steps": 111185, "total_steps": 119360, "loss": 0.2974, "lr": 1.4224885903888541e-07, "epoch": 18.63019436997319, "percentage": 93.15, "elapsed_time": "4:23:21", "remaining_time": "0:19:21", "throughput": 4078.83, "total_tokens": 64451120} +{"current_steps": 111190, "total_steps": 119360, "loss": 0.2728, "lr": 1.420757572316056e-07, "epoch": 18.63103217158177, "percentage": 93.16, "elapsed_time": "4:23:22", "remaining_time": "0:19:21", "throughput": 4078.85, "total_tokens": 64454352} +{"current_steps": 111195, "total_steps": 119360, "loss": 0.2768, "lr": 1.4190275929378107e-07, "epoch": 18.631869973190348, "percentage": 93.16, "elapsed_time": "4:23:22", "remaining_time": "0:19:20", "throughput": 4078.86, "total_tokens": 64457456} +{"current_steps": 111200, "total_steps": 119360, "loss": 0.2741, "lr": 1.4172986522910936e-07, "epoch": 18.632707774798927, "percentage": 93.16, "elapsed_time": "4:23:23", "remaining_time": "0:19:19", "throughput": 4078.86, "total_tokens": 64460336} +{"current_steps": 111205, "total_steps": 119360, "loss": 0.1877, "lr": 1.4155707504128924e-07, "epoch": 18.633545576407506, "percentage": 93.17, "elapsed_time": "4:23:24", "remaining_time": "0:19:18", "throughput": 4078.87, "total_tokens": 64463504} +{"current_steps": 111210, "total_steps": 119360, "loss": 0.3851, "lr": 1.4138438873401384e-07, "epoch": 18.634383378016086, "percentage": 93.17, "elapsed_time": "4:23:24", "remaining_time": "0:19:18", "throughput": 4078.88, "total_tokens": 64466256} +{"current_steps": 111215, "total_steps": 119360, "loss": 0.2041, "lr": 1.412118063109752e-07, "epoch": 18.635221179624665, "percentage": 93.18, "elapsed_time": "4:23:25", "remaining_time": "0:19:17", "throughput": 4078.89, "total_tokens": 64469104} +{"current_steps": 111220, "total_steps": 119360, "loss": 0.2815, "lr": 1.4103932777586428e-07, "epoch": 18.636058981233244, "percentage": 93.18, "elapsed_time": "4:23:26", "remaining_time": "0:19:16", "throughput": 4078.91, "total_tokens": 64472208} +{"current_steps": 111225, "total_steps": 119360, "loss": 0.2723, "lr": 1.408669531323681e-07, "epoch": 18.636896782841823, "percentage": 93.18, "elapsed_time": "4:23:26", "remaining_time": "0:19:16", "throughput": 4078.91, "total_tokens": 64474832} +{"current_steps": 111230, "total_steps": 119360, "loss": 0.3746, "lr": 1.4069468238417316e-07, "epoch": 18.637734584450403, "percentage": 93.19, "elapsed_time": "4:23:27", "remaining_time": "0:19:15", "throughput": 4078.92, "total_tokens": 64477552} +{"current_steps": 111235, "total_steps": 119360, "loss": 0.2588, "lr": 1.405225155349621e-07, "epoch": 18.638572386058982, "percentage": 93.19, "elapsed_time": "4:23:28", "remaining_time": "0:19:14", "throughput": 4078.93, "total_tokens": 64480464} +{"current_steps": 111240, "total_steps": 119360, "loss": 0.212, "lr": 1.403504525884164e-07, "epoch": 18.63941018766756, "percentage": 93.2, "elapsed_time": "4:23:28", "remaining_time": "0:19:13", "throughput": 4078.94, "total_tokens": 64483504} +{"current_steps": 111245, "total_steps": 119360, "loss": 0.2448, "lr": 1.4017849354821477e-07, "epoch": 18.64024798927614, "percentage": 93.2, "elapsed_time": "4:23:29", "remaining_time": "0:19:13", "throughput": 4078.95, "total_tokens": 64486416} +{"current_steps": 111250, "total_steps": 119360, "loss": 0.7701, "lr": 1.400066384180343e-07, "epoch": 18.64108579088472, "percentage": 93.21, "elapsed_time": "4:23:30", "remaining_time": "0:19:12", "throughput": 4078.95, "total_tokens": 64489040} +{"current_steps": 111255, "total_steps": 119360, "loss": 0.3258, "lr": 1.3983488720155037e-07, "epoch": 18.6419235924933, "percentage": 93.21, "elapsed_time": "4:23:30", "remaining_time": "0:19:11", "throughput": 4078.96, "total_tokens": 64491856} +{"current_steps": 111260, "total_steps": 119360, "loss": 0.4044, "lr": 1.396632399024328e-07, "epoch": 18.64276139410188, "percentage": 93.21, "elapsed_time": "4:23:31", "remaining_time": "0:19:11", "throughput": 4078.96, "total_tokens": 64494608} +{"current_steps": 111265, "total_steps": 119360, "loss": 0.3919, "lr": 1.3949169652435424e-07, "epoch": 18.643599195710454, "percentage": 93.22, "elapsed_time": "4:23:32", "remaining_time": "0:19:10", "throughput": 4078.97, "total_tokens": 64497424} +{"current_steps": 111270, "total_steps": 119360, "loss": 0.1868, "lr": 1.393202570709812e-07, "epoch": 18.644436997319033, "percentage": 93.22, "elapsed_time": "4:23:32", "remaining_time": "0:19:09", "throughput": 4078.99, "total_tokens": 64500464} +{"current_steps": 111275, "total_steps": 119360, "loss": 0.155, "lr": 1.3914892154597904e-07, "epoch": 18.645274798927613, "percentage": 93.23, "elapsed_time": "4:23:33", "remaining_time": "0:19:08", "throughput": 4078.99, "total_tokens": 64503120} +{"current_steps": 111280, "total_steps": 119360, "loss": 0.3034, "lr": 1.389776899530121e-07, "epoch": 18.646112600536192, "percentage": 93.23, "elapsed_time": "4:23:34", "remaining_time": "0:19:08", "throughput": 4079.0, "total_tokens": 64506320} +{"current_steps": 111285, "total_steps": 119360, "loss": 0.3485, "lr": 1.3880656229574074e-07, "epoch": 18.64695040214477, "percentage": 93.23, "elapsed_time": "4:23:34", "remaining_time": "0:19:07", "throughput": 4079.02, "total_tokens": 64509296} +{"current_steps": 111290, "total_steps": 119360, "loss": 0.7163, "lr": 1.3863553857782485e-07, "epoch": 18.64778820375335, "percentage": 93.24, "elapsed_time": "4:23:35", "remaining_time": "0:19:06", "throughput": 4079.03, "total_tokens": 64512112} +{"current_steps": 111295, "total_steps": 119360, "loss": 0.3306, "lr": 1.3846461880291985e-07, "epoch": 18.64862600536193, "percentage": 93.24, "elapsed_time": "4:23:36", "remaining_time": "0:19:06", "throughput": 4079.04, "total_tokens": 64515216} +{"current_steps": 111300, "total_steps": 119360, "loss": 0.3832, "lr": 1.3829380297468164e-07, "epoch": 18.64946380697051, "percentage": 93.25, "elapsed_time": "4:23:36", "remaining_time": "0:19:05", "throughput": 4079.05, "total_tokens": 64518128} +{"current_steps": 111305, "total_steps": 119360, "loss": 0.3343, "lr": 1.381230910967618e-07, "epoch": 18.65030160857909, "percentage": 93.25, "elapsed_time": "4:23:37", "remaining_time": "0:19:04", "throughput": 4079.05, "total_tokens": 64521008} +{"current_steps": 111310, "total_steps": 119360, "loss": 0.3805, "lr": 1.3795248317281073e-07, "epoch": 18.651139410187668, "percentage": 93.26, "elapsed_time": "4:23:38", "remaining_time": "0:19:03", "throughput": 4079.07, "total_tokens": 64524208} +{"current_steps": 111315, "total_steps": 119360, "loss": 0.2548, "lr": 1.3778197920647552e-07, "epoch": 18.651977211796247, "percentage": 93.26, "elapsed_time": "4:23:39", "remaining_time": "0:19:03", "throughput": 4079.08, "total_tokens": 64527312} +{"current_steps": 111320, "total_steps": 119360, "loss": 0.3922, "lr": 1.376115792014021e-07, "epoch": 18.652815013404826, "percentage": 93.26, "elapsed_time": "4:23:39", "remaining_time": "0:19:02", "throughput": 4079.09, "total_tokens": 64530192} +{"current_steps": 111325, "total_steps": 119360, "loss": 0.4299, "lr": 1.3744128316123485e-07, "epoch": 18.653652815013405, "percentage": 93.27, "elapsed_time": "4:23:40", "remaining_time": "0:19:01", "throughput": 4079.1, "total_tokens": 64532880} +{"current_steps": 111330, "total_steps": 119360, "loss": 0.3286, "lr": 1.3727109108961357e-07, "epoch": 18.654490616621985, "percentage": 93.27, "elapsed_time": "4:23:41", "remaining_time": "0:19:01", "throughput": 4079.11, "total_tokens": 64535728} +{"current_steps": 111335, "total_steps": 119360, "loss": 0.625, "lr": 1.3710100299017814e-07, "epoch": 18.655328418230564, "percentage": 93.28, "elapsed_time": "4:23:41", "remaining_time": "0:19:00", "throughput": 4079.12, "total_tokens": 64538896} +{"current_steps": 111340, "total_steps": 119360, "loss": 0.3408, "lr": 1.3693101886656456e-07, "epoch": 18.656166219839143, "percentage": 93.28, "elapsed_time": "4:23:42", "remaining_time": "0:18:59", "throughput": 4079.13, "total_tokens": 64541776} +{"current_steps": 111345, "total_steps": 119360, "loss": 0.3263, "lr": 1.367611387224077e-07, "epoch": 18.657004021447722, "percentage": 93.29, "elapsed_time": "4:23:43", "remaining_time": "0:18:59", "throughput": 4079.14, "total_tokens": 64544784} +{"current_steps": 111350, "total_steps": 119360, "loss": 0.8292, "lr": 1.365913625613402e-07, "epoch": 18.6578418230563, "percentage": 93.29, "elapsed_time": "4:23:43", "remaining_time": "0:18:58", "throughput": 4079.16, "total_tokens": 64547824} +{"current_steps": 111355, "total_steps": 119360, "loss": 0.3909, "lr": 1.3642169038699248e-07, "epoch": 18.65867962466488, "percentage": 93.29, "elapsed_time": "4:23:44", "remaining_time": "0:18:57", "throughput": 4079.17, "total_tokens": 64550800} +{"current_steps": 111360, "total_steps": 119360, "loss": 0.4836, "lr": 1.3625212220299e-07, "epoch": 18.65951742627346, "percentage": 93.3, "elapsed_time": "4:23:45", "remaining_time": "0:18:56", "throughput": 4079.18, "total_tokens": 64553776} +{"current_steps": 111365, "total_steps": 119360, "loss": 0.4552, "lr": 1.3608265801296095e-07, "epoch": 18.660355227882036, "percentage": 93.3, "elapsed_time": "4:23:45", "remaining_time": "0:18:56", "throughput": 4079.19, "total_tokens": 64556624} +{"current_steps": 111370, "total_steps": 119360, "loss": 0.5154, "lr": 1.3591329782052854e-07, "epoch": 18.661193029490615, "percentage": 93.31, "elapsed_time": "4:23:46", "remaining_time": "0:18:55", "throughput": 4079.19, "total_tokens": 64559248} +{"current_steps": 111375, "total_steps": 119360, "loss": 0.5412, "lr": 1.3574404162931265e-07, "epoch": 18.662030831099194, "percentage": 93.31, "elapsed_time": "4:23:47", "remaining_time": "0:18:54", "throughput": 4079.2, "total_tokens": 64561936} +{"current_steps": 111380, "total_steps": 119360, "loss": 0.3946, "lr": 1.3557488944293263e-07, "epoch": 18.662868632707774, "percentage": 93.31, "elapsed_time": "4:23:47", "remaining_time": "0:18:54", "throughput": 4079.21, "total_tokens": 64564720} +{"current_steps": 111385, "total_steps": 119360, "loss": 0.2443, "lr": 1.3540584126500555e-07, "epoch": 18.663706434316353, "percentage": 93.32, "elapsed_time": "4:23:48", "remaining_time": "0:18:53", "throughput": 4079.22, "total_tokens": 64567600} +{"current_steps": 111390, "total_steps": 119360, "loss": 0.4778, "lr": 1.3523689709914524e-07, "epoch": 18.664544235924932, "percentage": 93.32, "elapsed_time": "4:23:49", "remaining_time": "0:18:52", "throughput": 4079.23, "total_tokens": 64570832} +{"current_steps": 111395, "total_steps": 119360, "loss": 0.2919, "lr": 1.3506805694896486e-07, "epoch": 18.66538203753351, "percentage": 93.33, "elapsed_time": "4:23:49", "remaining_time": "0:18:51", "throughput": 4079.24, "total_tokens": 64573712} +{"current_steps": 111400, "total_steps": 119360, "loss": 0.2537, "lr": 1.3489932081807434e-07, "epoch": 18.66621983914209, "percentage": 93.33, "elapsed_time": "4:23:50", "remaining_time": "0:18:51", "throughput": 4079.26, "total_tokens": 64576880} +{"current_steps": 111405, "total_steps": 119360, "loss": 0.098, "lr": 1.3473068871008077e-07, "epoch": 18.66705764075067, "percentage": 93.34, "elapsed_time": "4:23:51", "remaining_time": "0:18:50", "throughput": 4079.27, "total_tokens": 64579792} +{"current_steps": 111410, "total_steps": 119360, "loss": 0.221, "lr": 1.3456216062859017e-07, "epoch": 18.66789544235925, "percentage": 93.34, "elapsed_time": "4:23:51", "remaining_time": "0:18:49", "throughput": 4079.28, "total_tokens": 64582768} +{"current_steps": 111415, "total_steps": 119360, "loss": 0.2377, "lr": 1.343937365772069e-07, "epoch": 18.66873324396783, "percentage": 93.34, "elapsed_time": "4:23:52", "remaining_time": "0:18:49", "throughput": 4079.29, "total_tokens": 64585808} +{"current_steps": 111420, "total_steps": 119360, "loss": 0.3441, "lr": 1.3422541655953024e-07, "epoch": 18.669571045576408, "percentage": 93.35, "elapsed_time": "4:23:53", "remaining_time": "0:18:48", "throughput": 4079.3, "total_tokens": 64588752} +{"current_steps": 111425, "total_steps": 119360, "loss": 0.5643, "lr": 1.340572005791596e-07, "epoch": 18.670408847184987, "percentage": 93.35, "elapsed_time": "4:23:53", "remaining_time": "0:18:47", "throughput": 4079.32, "total_tokens": 64591824} +{"current_steps": 111430, "total_steps": 119360, "loss": 0.3847, "lr": 1.338890886396932e-07, "epoch": 18.671246648793566, "percentage": 93.36, "elapsed_time": "4:23:54", "remaining_time": "0:18:46", "throughput": 4079.32, "total_tokens": 64594576} +{"current_steps": 111435, "total_steps": 119360, "loss": 0.4088, "lr": 1.3372108074472368e-07, "epoch": 18.672084450402146, "percentage": 93.36, "elapsed_time": "4:23:55", "remaining_time": "0:18:46", "throughput": 4079.33, "total_tokens": 64597328} +{"current_steps": 111440, "total_steps": 119360, "loss": 0.1898, "lr": 1.3355317689784432e-07, "epoch": 18.672922252010725, "percentage": 93.36, "elapsed_time": "4:23:55", "remaining_time": "0:18:45", "throughput": 4079.33, "total_tokens": 64600176} +{"current_steps": 111445, "total_steps": 119360, "loss": 0.125, "lr": 1.3338537710264442e-07, "epoch": 18.673760053619304, "percentage": 93.37, "elapsed_time": "4:23:56", "remaining_time": "0:18:44", "throughput": 4079.34, "total_tokens": 64602832} +{"current_steps": 111450, "total_steps": 119360, "loss": 0.4026, "lr": 1.3321768136271285e-07, "epoch": 18.674597855227884, "percentage": 93.37, "elapsed_time": "4:23:57", "remaining_time": "0:18:44", "throughput": 4079.34, "total_tokens": 64605520} +{"current_steps": 111455, "total_steps": 119360, "loss": 0.3512, "lr": 1.3305008968163446e-07, "epoch": 18.675435656836463, "percentage": 93.38, "elapsed_time": "4:23:57", "remaining_time": "0:18:43", "throughput": 4079.35, "total_tokens": 64608464} +{"current_steps": 111460, "total_steps": 119360, "loss": 0.185, "lr": 1.3288260206299307e-07, "epoch": 18.67627345844504, "percentage": 93.38, "elapsed_time": "4:23:58", "remaining_time": "0:18:42", "throughput": 4079.37, "total_tokens": 64611568} +{"current_steps": 111465, "total_steps": 119360, "loss": 0.4609, "lr": 1.3271521851036806e-07, "epoch": 18.677111260053618, "percentage": 93.39, "elapsed_time": "4:23:59", "remaining_time": "0:18:41", "throughput": 4079.37, "total_tokens": 64614352} +{"current_steps": 111470, "total_steps": 119360, "loss": 0.3579, "lr": 1.3254793902734042e-07, "epoch": 18.677949061662197, "percentage": 93.39, "elapsed_time": "4:23:59", "remaining_time": "0:18:41", "throughput": 4079.38, "total_tokens": 64617296} +{"current_steps": 111475, "total_steps": 119360, "loss": 0.3788, "lr": 1.3238076361748674e-07, "epoch": 18.678786863270776, "percentage": 93.39, "elapsed_time": "4:24:00", "remaining_time": "0:18:40", "throughput": 4079.4, "total_tokens": 64620432} +{"current_steps": 111480, "total_steps": 119360, "loss": 0.3771, "lr": 1.3221369228438085e-07, "epoch": 18.679624664879356, "percentage": 93.4, "elapsed_time": "4:24:01", "remaining_time": "0:18:39", "throughput": 4079.41, "total_tokens": 64623312} +{"current_steps": 111485, "total_steps": 119360, "loss": 0.564, "lr": 1.3204672503159377e-07, "epoch": 18.680462466487935, "percentage": 93.4, "elapsed_time": "4:24:01", "remaining_time": "0:18:39", "throughput": 4079.41, "total_tokens": 64625936} +{"current_steps": 111490, "total_steps": 119360, "loss": 0.2379, "lr": 1.318798618626982e-07, "epoch": 18.681300268096514, "percentage": 93.41, "elapsed_time": "4:24:02", "remaining_time": "0:18:38", "throughput": 4079.41, "total_tokens": 64628688} +{"current_steps": 111495, "total_steps": 119360, "loss": 0.5721, "lr": 1.317131027812596e-07, "epoch": 18.682138069705093, "percentage": 93.41, "elapsed_time": "4:24:03", "remaining_time": "0:18:37", "throughput": 4079.43, "total_tokens": 64631600} +{"current_steps": 111500, "total_steps": 119360, "loss": 0.46, "lr": 1.3154644779084402e-07, "epoch": 18.682975871313673, "percentage": 93.41, "elapsed_time": "4:24:03", "remaining_time": "0:18:36", "throughput": 4079.44, "total_tokens": 64634576} +{"current_steps": 111505, "total_steps": 119360, "loss": 0.5525, "lr": 1.3137989689501585e-07, "epoch": 18.683813672922252, "percentage": 93.42, "elapsed_time": "4:24:04", "remaining_time": "0:18:36", "throughput": 4079.44, "total_tokens": 64637392} +{"current_steps": 111510, "total_steps": 119360, "loss": 0.3904, "lr": 1.3121345009733498e-07, "epoch": 18.68465147453083, "percentage": 93.42, "elapsed_time": "4:24:05", "remaining_time": "0:18:35", "throughput": 4079.46, "total_tokens": 64640432} +{"current_steps": 111515, "total_steps": 119360, "loss": 0.2212, "lr": 1.3104710740136083e-07, "epoch": 18.68548927613941, "percentage": 93.43, "elapsed_time": "4:24:05", "remaining_time": "0:18:34", "throughput": 4079.46, "total_tokens": 64643152} +{"current_steps": 111520, "total_steps": 119360, "loss": 0.2086, "lr": 1.3088086881065054e-07, "epoch": 18.68632707774799, "percentage": 93.43, "elapsed_time": "4:24:06", "remaining_time": "0:18:34", "throughput": 4079.48, "total_tokens": 64646096} +{"current_steps": 111525, "total_steps": 119360, "loss": 0.306, "lr": 1.3071473432875737e-07, "epoch": 18.68716487935657, "percentage": 93.44, "elapsed_time": "4:24:07", "remaining_time": "0:18:33", "throughput": 4079.49, "total_tokens": 64649264} +{"current_steps": 111530, "total_steps": 119360, "loss": 0.2311, "lr": 1.3054870395923402e-07, "epoch": 18.68800268096515, "percentage": 93.44, "elapsed_time": "4:24:08", "remaining_time": "0:18:32", "throughput": 4079.5, "total_tokens": 64652304} +{"current_steps": 111535, "total_steps": 119360, "loss": 0.4404, "lr": 1.3038277770563157e-07, "epoch": 18.688840482573728, "percentage": 93.44, "elapsed_time": "4:24:08", "remaining_time": "0:18:31", "throughput": 4079.51, "total_tokens": 64655120} +{"current_steps": 111540, "total_steps": 119360, "loss": 0.2509, "lr": 1.302169555714955e-07, "epoch": 18.689678284182307, "percentage": 93.45, "elapsed_time": "4:24:09", "remaining_time": "0:18:31", "throughput": 4079.52, "total_tokens": 64658064} +{"current_steps": 111545, "total_steps": 119360, "loss": 0.5005, "lr": 1.3005123756037298e-07, "epoch": 18.690516085790886, "percentage": 93.45, "elapsed_time": "4:24:10", "remaining_time": "0:18:30", "throughput": 4079.53, "total_tokens": 64661072} +{"current_steps": 111550, "total_steps": 119360, "loss": 0.3389, "lr": 1.2988562367580726e-07, "epoch": 18.691353887399465, "percentage": 93.46, "elapsed_time": "4:24:10", "remaining_time": "0:18:29", "throughput": 4079.54, "total_tokens": 64664240} +{"current_steps": 111555, "total_steps": 119360, "loss": 0.4443, "lr": 1.2972011392133887e-07, "epoch": 18.69219168900804, "percentage": 93.46, "elapsed_time": "4:24:11", "remaining_time": "0:18:29", "throughput": 4079.55, "total_tokens": 64667024} +{"current_steps": 111560, "total_steps": 119360, "loss": 0.5035, "lr": 1.2955470830050664e-07, "epoch": 18.69302949061662, "percentage": 93.47, "elapsed_time": "4:24:12", "remaining_time": "0:18:28", "throughput": 4079.55, "total_tokens": 64669808} +{"current_steps": 111565, "total_steps": 119360, "loss": 0.4225, "lr": 1.2938940681684775e-07, "epoch": 18.6938672922252, "percentage": 93.47, "elapsed_time": "4:24:12", "remaining_time": "0:18:27", "throughput": 4079.56, "total_tokens": 64672624} +{"current_steps": 111570, "total_steps": 119360, "loss": 0.2978, "lr": 1.2922420947389546e-07, "epoch": 18.69470509383378, "percentage": 93.47, "elapsed_time": "4:24:13", "remaining_time": "0:18:26", "throughput": 4079.57, "total_tokens": 64675248} +{"current_steps": 111575, "total_steps": 119360, "loss": 0.3379, "lr": 1.2905911627518307e-07, "epoch": 18.695542895442358, "percentage": 93.48, "elapsed_time": "4:24:14", "remaining_time": "0:18:26", "throughput": 4079.57, "total_tokens": 64678096} +{"current_steps": 111580, "total_steps": 119360, "loss": 0.5926, "lr": 1.2889412722424054e-07, "epoch": 18.696380697050937, "percentage": 93.48, "elapsed_time": "4:24:14", "remaining_time": "0:18:25", "throughput": 4079.58, "total_tokens": 64681104} +{"current_steps": 111585, "total_steps": 119360, "loss": 0.3166, "lr": 1.287292423245945e-07, "epoch": 18.697218498659517, "percentage": 93.49, "elapsed_time": "4:24:15", "remaining_time": "0:18:24", "throughput": 4079.59, "total_tokens": 64683824} +{"current_steps": 111590, "total_steps": 119360, "loss": 0.3525, "lr": 1.28564461579771e-07, "epoch": 18.698056300268096, "percentage": 93.49, "elapsed_time": "4:24:16", "remaining_time": "0:18:24", "throughput": 4079.61, "total_tokens": 64686960} +{"current_steps": 111595, "total_steps": 119360, "loss": 0.314, "lr": 1.2839978499329385e-07, "epoch": 18.698894101876675, "percentage": 93.49, "elapsed_time": "4:24:16", "remaining_time": "0:18:23", "throughput": 4079.62, "total_tokens": 64689872} +{"current_steps": 111600, "total_steps": 119360, "loss": 0.2351, "lr": 1.2823521256868366e-07, "epoch": 18.699731903485254, "percentage": 93.5, "elapsed_time": "4:24:17", "remaining_time": "0:18:22", "throughput": 4079.63, "total_tokens": 64692912} +{"current_steps": 111605, "total_steps": 119360, "loss": 0.2711, "lr": 1.2807074430945865e-07, "epoch": 18.700569705093834, "percentage": 93.5, "elapsed_time": "4:24:18", "remaining_time": "0:18:21", "throughput": 4079.64, "total_tokens": 64695728} +{"current_steps": 111610, "total_steps": 119360, "loss": 0.3953, "lr": 1.2790638021913604e-07, "epoch": 18.701407506702413, "percentage": 93.51, "elapsed_time": "4:24:18", "remaining_time": "0:18:21", "throughput": 4079.65, "total_tokens": 64698832} +{"current_steps": 111615, "total_steps": 119360, "loss": 0.4563, "lr": 1.2774212030123024e-07, "epoch": 18.702245308310992, "percentage": 93.51, "elapsed_time": "4:24:19", "remaining_time": "0:18:20", "throughput": 4079.66, "total_tokens": 64701616} +{"current_steps": 111620, "total_steps": 119360, "loss": 0.3658, "lr": 1.2757796455925288e-07, "epoch": 18.70308310991957, "percentage": 93.52, "elapsed_time": "4:24:20", "remaining_time": "0:18:19", "throughput": 4079.67, "total_tokens": 64704528} +{"current_steps": 111625, "total_steps": 119360, "loss": 0.4058, "lr": 1.2741391299671503e-07, "epoch": 18.70392091152815, "percentage": 93.52, "elapsed_time": "4:24:20", "remaining_time": "0:18:19", "throughput": 4079.67, "total_tokens": 64706992} +{"current_steps": 111630, "total_steps": 119360, "loss": 0.2419, "lr": 1.2724996561712167e-07, "epoch": 18.70475871313673, "percentage": 93.52, "elapsed_time": "4:24:21", "remaining_time": "0:18:18", "throughput": 4079.67, "total_tokens": 64709776} +{"current_steps": 111635, "total_steps": 119360, "loss": 0.2989, "lr": 1.270861224239811e-07, "epoch": 18.70559651474531, "percentage": 93.53, "elapsed_time": "4:24:22", "remaining_time": "0:18:17", "throughput": 4079.68, "total_tokens": 64712432} +{"current_steps": 111640, "total_steps": 119360, "loss": 0.37, "lr": 1.2692238342079556e-07, "epoch": 18.70643431635389, "percentage": 93.53, "elapsed_time": "4:24:22", "remaining_time": "0:18:16", "throughput": 4079.69, "total_tokens": 64715184} +{"current_steps": 111645, "total_steps": 119360, "loss": 0.31, "lr": 1.2675874861106607e-07, "epoch": 18.707272117962468, "percentage": 93.54, "elapsed_time": "4:24:23", "remaining_time": "0:18:16", "throughput": 4079.7, "total_tokens": 64718192} +{"current_steps": 111650, "total_steps": 119360, "loss": 0.1606, "lr": 1.265952179982899e-07, "epoch": 18.708109919571047, "percentage": 93.54, "elapsed_time": "4:24:24", "remaining_time": "0:18:15", "throughput": 4079.71, "total_tokens": 64721040} +{"current_steps": 111655, "total_steps": 119360, "loss": 0.1519, "lr": 1.2643179158596642e-07, "epoch": 18.708947721179626, "percentage": 93.54, "elapsed_time": "4:24:24", "remaining_time": "0:18:14", "throughput": 4079.73, "total_tokens": 64724240} +{"current_steps": 111660, "total_steps": 119360, "loss": 0.3512, "lr": 1.2626846937758729e-07, "epoch": 18.709785522788202, "percentage": 93.55, "elapsed_time": "4:24:25", "remaining_time": "0:18:14", "throughput": 4079.73, "total_tokens": 64727056} +{"current_steps": 111665, "total_steps": 119360, "loss": 0.3113, "lr": 1.2610525137664642e-07, "epoch": 18.71062332439678, "percentage": 93.55, "elapsed_time": "4:24:26", "remaining_time": "0:18:13", "throughput": 4079.74, "total_tokens": 64729776} +{"current_steps": 111670, "total_steps": 119360, "loss": 0.4377, "lr": 1.259421375866321e-07, "epoch": 18.71146112600536, "percentage": 93.56, "elapsed_time": "4:24:26", "remaining_time": "0:18:12", "throughput": 4079.74, "total_tokens": 64732400} +{"current_steps": 111675, "total_steps": 119360, "loss": 0.3968, "lr": 1.257791280110332e-07, "epoch": 18.71229892761394, "percentage": 93.56, "elapsed_time": "4:24:27", "remaining_time": "0:18:11", "throughput": 4079.75, "total_tokens": 64735216} +{"current_steps": 111680, "total_steps": 119360, "loss": 0.2404, "lr": 1.2561622265333474e-07, "epoch": 18.71313672922252, "percentage": 93.57, "elapsed_time": "4:24:28", "remaining_time": "0:18:11", "throughput": 4079.76, "total_tokens": 64738320} +{"current_steps": 111685, "total_steps": 119360, "loss": 0.1165, "lr": 1.2545342151702001e-07, "epoch": 18.7139745308311, "percentage": 93.57, "elapsed_time": "4:24:28", "remaining_time": "0:18:10", "throughput": 4079.77, "total_tokens": 64741008} +{"current_steps": 111690, "total_steps": 119360, "loss": 0.1328, "lr": 1.25290724605569e-07, "epoch": 18.714812332439678, "percentage": 93.57, "elapsed_time": "4:24:29", "remaining_time": "0:18:09", "throughput": 4079.78, "total_tokens": 64743824} +{"current_steps": 111695, "total_steps": 119360, "loss": 0.3834, "lr": 1.251281319224612e-07, "epoch": 18.715650134048257, "percentage": 93.58, "elapsed_time": "4:24:30", "remaining_time": "0:18:09", "throughput": 4079.79, "total_tokens": 64746832} +{"current_steps": 111700, "total_steps": 119360, "loss": 0.4856, "lr": 1.2496564347117323e-07, "epoch": 18.716487935656836, "percentage": 93.58, "elapsed_time": "4:24:30", "remaining_time": "0:18:08", "throughput": 4079.8, "total_tokens": 64749616} +{"current_steps": 111705, "total_steps": 119360, "loss": 0.1679, "lr": 1.24803259255179e-07, "epoch": 18.717325737265416, "percentage": 93.59, "elapsed_time": "4:24:31", "remaining_time": "0:18:07", "throughput": 4079.81, "total_tokens": 64752528} +{"current_steps": 111710, "total_steps": 119360, "loss": 0.3585, "lr": 1.2464097927795017e-07, "epoch": 18.718163538873995, "percentage": 93.59, "elapsed_time": "4:24:32", "remaining_time": "0:18:06", "throughput": 4079.81, "total_tokens": 64755248} +{"current_steps": 111715, "total_steps": 119360, "loss": 0.1889, "lr": 1.2447880354295782e-07, "epoch": 18.719001340482574, "percentage": 93.6, "elapsed_time": "4:24:32", "remaining_time": "0:18:06", "throughput": 4079.82, "total_tokens": 64758160} +{"current_steps": 111720, "total_steps": 119360, "loss": 0.2197, "lr": 1.243167320536681e-07, "epoch": 18.719839142091153, "percentage": 93.6, "elapsed_time": "4:24:33", "remaining_time": "0:18:05", "throughput": 4079.84, "total_tokens": 64761520} +{"current_steps": 111725, "total_steps": 119360, "loss": 0.4124, "lr": 1.241547648135466e-07, "epoch": 18.720676943699733, "percentage": 93.6, "elapsed_time": "4:24:34", "remaining_time": "0:18:04", "throughput": 4079.85, "total_tokens": 64764432} +{"current_steps": 111730, "total_steps": 119360, "loss": 0.3255, "lr": 1.2399290182605716e-07, "epoch": 18.721514745308312, "percentage": 93.61, "elapsed_time": "4:24:34", "remaining_time": "0:18:04", "throughput": 4079.85, "total_tokens": 64767024} +{"current_steps": 111735, "total_steps": 119360, "loss": 0.484, "lr": 1.2383114309465983e-07, "epoch": 18.72235254691689, "percentage": 93.61, "elapsed_time": "4:24:35", "remaining_time": "0:18:03", "throughput": 4079.86, "total_tokens": 64770000} +{"current_steps": 111740, "total_steps": 119360, "loss": 0.533, "lr": 1.2366948862281347e-07, "epoch": 18.72319034852547, "percentage": 93.62, "elapsed_time": "4:24:36", "remaining_time": "0:18:02", "throughput": 4079.88, "total_tokens": 64773360} +{"current_steps": 111745, "total_steps": 119360, "loss": 0.2583, "lr": 1.2350793841397535e-07, "epoch": 18.72402815013405, "percentage": 93.62, "elapsed_time": "4:24:37", "remaining_time": "0:18:01", "throughput": 4079.89, "total_tokens": 64776432} +{"current_steps": 111750, "total_steps": 119360, "loss": 0.563, "lr": 1.2334649247159826e-07, "epoch": 18.72486595174263, "percentage": 93.62, "elapsed_time": "4:24:37", "remaining_time": "0:18:01", "throughput": 4079.9, "total_tokens": 64779184} +{"current_steps": 111755, "total_steps": 119360, "loss": 0.3474, "lr": 1.2318515079913386e-07, "epoch": 18.725703753351205, "percentage": 93.63, "elapsed_time": "4:24:38", "remaining_time": "0:18:00", "throughput": 4079.91, "total_tokens": 64782064} +{"current_steps": 111760, "total_steps": 119360, "loss": 0.3805, "lr": 1.230239134000344e-07, "epoch": 18.726541554959784, "percentage": 93.63, "elapsed_time": "4:24:38", "remaining_time": "0:17:59", "throughput": 4079.91, "total_tokens": 64784784} +{"current_steps": 111765, "total_steps": 119360, "loss": 0.3216, "lr": 1.2286278027774489e-07, "epoch": 18.727379356568363, "percentage": 93.64, "elapsed_time": "4:24:39", "remaining_time": "0:17:59", "throughput": 4079.92, "total_tokens": 64787920} +{"current_steps": 111770, "total_steps": 119360, "loss": 0.3604, "lr": 1.227017514357115e-07, "epoch": 18.728217158176943, "percentage": 93.64, "elapsed_time": "4:24:40", "remaining_time": "0:17:58", "throughput": 4079.93, "total_tokens": 64790736} +{"current_steps": 111775, "total_steps": 119360, "loss": 0.5326, "lr": 1.2254082687737702e-07, "epoch": 18.729054959785522, "percentage": 93.65, "elapsed_time": "4:24:41", "remaining_time": "0:17:57", "throughput": 4079.95, "total_tokens": 64793968} +{"current_steps": 111780, "total_steps": 119360, "loss": 0.2094, "lr": 1.223800066061831e-07, "epoch": 18.7298927613941, "percentage": 93.65, "elapsed_time": "4:24:41", "remaining_time": "0:17:56", "throughput": 4079.96, "total_tokens": 64796816} +{"current_steps": 111785, "total_steps": 119360, "loss": 0.2234, "lr": 1.2221929062556704e-07, "epoch": 18.73073056300268, "percentage": 93.65, "elapsed_time": "4:24:42", "remaining_time": "0:17:56", "throughput": 4079.96, "total_tokens": 64799824} +{"current_steps": 111790, "total_steps": 119360, "loss": 0.35, "lr": 1.220586789389666e-07, "epoch": 18.73156836461126, "percentage": 93.66, "elapsed_time": "4:24:43", "remaining_time": "0:17:55", "throughput": 4079.97, "total_tokens": 64802640} +{"current_steps": 111795, "total_steps": 119360, "loss": 0.5925, "lr": 1.2189817154981354e-07, "epoch": 18.73240616621984, "percentage": 93.66, "elapsed_time": "4:24:43", "remaining_time": "0:17:54", "throughput": 4079.98, "total_tokens": 64805552} +{"current_steps": 111800, "total_steps": 119360, "loss": 0.2179, "lr": 1.2173776846154228e-07, "epoch": 18.733243967828418, "percentage": 93.67, "elapsed_time": "4:24:44", "remaining_time": "0:17:54", "throughput": 4079.99, "total_tokens": 64808240} +{"current_steps": 111805, "total_steps": 119360, "loss": 0.1528, "lr": 1.2157746967758177e-07, "epoch": 18.734081769436997, "percentage": 93.67, "elapsed_time": "4:24:45", "remaining_time": "0:17:53", "throughput": 4080.0, "total_tokens": 64811248} +{"current_steps": 111810, "total_steps": 119360, "loss": 0.5978, "lr": 1.214172752013587e-07, "epoch": 18.734919571045577, "percentage": 93.67, "elapsed_time": "4:24:45", "remaining_time": "0:17:52", "throughput": 4080.01, "total_tokens": 64814128} +{"current_steps": 111815, "total_steps": 119360, "loss": 0.3629, "lr": 1.2125718503629814e-07, "epoch": 18.735757372654156, "percentage": 93.68, "elapsed_time": "4:24:46", "remaining_time": "0:17:51", "throughput": 4080.02, "total_tokens": 64816976} +{"current_steps": 111820, "total_steps": 119360, "loss": 0.5228, "lr": 1.2109719918582452e-07, "epoch": 18.736595174262735, "percentage": 93.68, "elapsed_time": "4:24:47", "remaining_time": "0:17:51", "throughput": 4080.03, "total_tokens": 64820048} +{"current_steps": 111825, "total_steps": 119360, "loss": 0.2612, "lr": 1.2093731765335736e-07, "epoch": 18.737432975871315, "percentage": 93.69, "elapsed_time": "4:24:47", "remaining_time": "0:17:50", "throughput": 4080.04, "total_tokens": 64822928} +{"current_steps": 111830, "total_steps": 119360, "loss": 0.3759, "lr": 1.207775404423156e-07, "epoch": 18.738270777479894, "percentage": 93.69, "elapsed_time": "4:24:48", "remaining_time": "0:17:49", "throughput": 4080.05, "total_tokens": 64825648} +{"current_steps": 111835, "total_steps": 119360, "loss": 0.3811, "lr": 1.2061786755611482e-07, "epoch": 18.739108579088473, "percentage": 93.7, "elapsed_time": "4:24:49", "remaining_time": "0:17:49", "throughput": 4080.06, "total_tokens": 64828560} +{"current_steps": 111840, "total_steps": 119360, "loss": 0.5115, "lr": 1.2045829899817007e-07, "epoch": 18.739946380697052, "percentage": 93.7, "elapsed_time": "4:24:49", "remaining_time": "0:17:48", "throughput": 4080.07, "total_tokens": 64831440} +{"current_steps": 111845, "total_steps": 119360, "loss": 0.3665, "lr": 1.202988347718925e-07, "epoch": 18.74078418230563, "percentage": 93.7, "elapsed_time": "4:24:50", "remaining_time": "0:17:47", "throughput": 4080.09, "total_tokens": 64834736} +{"current_steps": 111850, "total_steps": 119360, "loss": 0.3752, "lr": 1.2013947488069222e-07, "epoch": 18.741621983914207, "percentage": 93.71, "elapsed_time": "4:24:51", "remaining_time": "0:17:46", "throughput": 4080.1, "total_tokens": 64837936} +{"current_steps": 111855, "total_steps": 119360, "loss": 0.4726, "lr": 1.1998021932797533e-07, "epoch": 18.742459785522787, "percentage": 93.71, "elapsed_time": "4:24:51", "remaining_time": "0:17:46", "throughput": 4080.11, "total_tokens": 64840880} +{"current_steps": 111860, "total_steps": 119360, "loss": 0.281, "lr": 1.1982106811714855e-07, "epoch": 18.743297587131366, "percentage": 93.72, "elapsed_time": "4:24:52", "remaining_time": "0:17:45", "throughput": 4080.13, "total_tokens": 64843984} +{"current_steps": 111865, "total_steps": 119360, "loss": 0.2853, "lr": 1.1966202125161418e-07, "epoch": 18.744135388739945, "percentage": 93.72, "elapsed_time": "4:24:53", "remaining_time": "0:17:44", "throughput": 4080.13, "total_tokens": 64846960} +{"current_steps": 111870, "total_steps": 119360, "loss": 0.4791, "lr": 1.1950307873477228e-07, "epoch": 18.744973190348524, "percentage": 93.72, "elapsed_time": "4:24:54", "remaining_time": "0:17:44", "throughput": 4080.14, "total_tokens": 64849808} +{"current_steps": 111875, "total_steps": 119360, "loss": 0.3068, "lr": 1.1934424057002126e-07, "epoch": 18.745810991957104, "percentage": 93.73, "elapsed_time": "4:24:54", "remaining_time": "0:17:43", "throughput": 4080.14, "total_tokens": 64852528} +{"current_steps": 111880, "total_steps": 119360, "loss": 0.48, "lr": 1.1918550676075891e-07, "epoch": 18.746648793565683, "percentage": 93.73, "elapsed_time": "4:24:55", "remaining_time": "0:17:42", "throughput": 4080.15, "total_tokens": 64855600} +{"current_steps": 111885, "total_steps": 119360, "loss": 0.4784, "lr": 1.1902687731037754e-07, "epoch": 18.747486595174262, "percentage": 93.74, "elapsed_time": "4:24:56", "remaining_time": "0:17:42", "throughput": 4080.17, "total_tokens": 64858736} +{"current_steps": 111890, "total_steps": 119360, "loss": 0.3187, "lr": 1.1886835222226945e-07, "epoch": 18.74832439678284, "percentage": 93.74, "elapsed_time": "4:24:56", "remaining_time": "0:17:41", "throughput": 4080.18, "total_tokens": 64861616} +{"current_steps": 111895, "total_steps": 119360, "loss": 0.1645, "lr": 1.1870993149982413e-07, "epoch": 18.74916219839142, "percentage": 93.75, "elapsed_time": "4:24:57", "remaining_time": "0:17:40", "throughput": 4080.18, "total_tokens": 64864240} +{"current_steps": 111900, "total_steps": 119360, "loss": 0.178, "lr": 1.1855161514642833e-07, "epoch": 18.75, "percentage": 93.75, "elapsed_time": "4:24:58", "remaining_time": "0:17:39", "throughput": 4080.19, "total_tokens": 64867152} +{"current_steps": 111905, "total_steps": 119360, "loss": 0.2804, "lr": 1.1839340316546766e-07, "epoch": 18.75083780160858, "percentage": 93.75, "elapsed_time": "4:24:58", "remaining_time": "0:17:39", "throughput": 4080.2, "total_tokens": 64870416} +{"current_steps": 111910, "total_steps": 119360, "loss": 0.2485, "lr": 1.1823529556032554e-07, "epoch": 18.75167560321716, "percentage": 93.76, "elapsed_time": "4:24:59", "remaining_time": "0:17:38", "throughput": 4080.2, "total_tokens": 64873168} +{"current_steps": 111915, "total_steps": 119360, "loss": 0.415, "lr": 1.1807729233438148e-07, "epoch": 18.752513404825738, "percentage": 93.76, "elapsed_time": "4:25:00", "remaining_time": "0:17:37", "throughput": 4080.21, "total_tokens": 64876144} +{"current_steps": 111920, "total_steps": 119360, "loss": 0.3972, "lr": 1.1791939349101333e-07, "epoch": 18.753351206434317, "percentage": 93.77, "elapsed_time": "4:25:00", "remaining_time": "0:17:37", "throughput": 4080.22, "total_tokens": 64878864} +{"current_steps": 111925, "total_steps": 119360, "loss": 0.4049, "lr": 1.1776159903359896e-07, "epoch": 18.754189008042896, "percentage": 93.77, "elapsed_time": "4:25:01", "remaining_time": "0:17:36", "throughput": 4080.23, "total_tokens": 64881840} +{"current_steps": 111930, "total_steps": 119360, "loss": 0.542, "lr": 1.1760390896551121e-07, "epoch": 18.755026809651476, "percentage": 93.78, "elapsed_time": "4:25:02", "remaining_time": "0:17:35", "throughput": 4080.25, "total_tokens": 64884912} +{"current_steps": 111935, "total_steps": 119360, "loss": 0.4992, "lr": 1.1744632329012129e-07, "epoch": 18.755864611260055, "percentage": 93.78, "elapsed_time": "4:25:02", "remaining_time": "0:17:34", "throughput": 4080.25, "total_tokens": 64887696} +{"current_steps": 111940, "total_steps": 119360, "loss": 0.5142, "lr": 1.1728884201079927e-07, "epoch": 18.756702412868634, "percentage": 93.78, "elapsed_time": "4:25:03", "remaining_time": "0:17:34", "throughput": 4080.27, "total_tokens": 64890864} +{"current_steps": 111945, "total_steps": 119360, "loss": 0.3057, "lr": 1.1713146513091245e-07, "epoch": 18.757540214477213, "percentage": 93.79, "elapsed_time": "4:25:04", "remaining_time": "0:17:33", "throughput": 4080.28, "total_tokens": 64893744} +{"current_steps": 111950, "total_steps": 119360, "loss": 0.274, "lr": 1.1697419265382537e-07, "epoch": 18.758378016085793, "percentage": 93.79, "elapsed_time": "4:25:04", "remaining_time": "0:17:32", "throughput": 4080.28, "total_tokens": 64896720} +{"current_steps": 111955, "total_steps": 119360, "loss": 0.3314, "lr": 1.1681702458290145e-07, "epoch": 18.75921581769437, "percentage": 93.8, "elapsed_time": "4:25:05", "remaining_time": "0:17:32", "throughput": 4080.29, "total_tokens": 64899568} +{"current_steps": 111960, "total_steps": 119360, "loss": 0.2396, "lr": 1.1665996092149966e-07, "epoch": 18.760053619302948, "percentage": 93.8, "elapsed_time": "4:25:06", "remaining_time": "0:17:31", "throughput": 4080.3, "total_tokens": 64902544} +{"current_steps": 111965, "total_steps": 119360, "loss": 0.4622, "lr": 1.1650300167297956e-07, "epoch": 18.760891420911527, "percentage": 93.8, "elapsed_time": "4:25:06", "remaining_time": "0:17:30", "throughput": 4080.31, "total_tokens": 64905424} +{"current_steps": 111970, "total_steps": 119360, "loss": 0.1397, "lr": 1.1634614684069679e-07, "epoch": 18.761729222520106, "percentage": 93.81, "elapsed_time": "4:25:07", "remaining_time": "0:17:29", "throughput": 4080.32, "total_tokens": 64908496} +{"current_steps": 111975, "total_steps": 119360, "loss": 0.3531, "lr": 1.1618939642800531e-07, "epoch": 18.762567024128685, "percentage": 93.81, "elapsed_time": "4:25:08", "remaining_time": "0:17:29", "throughput": 4080.33, "total_tokens": 64911344} +{"current_steps": 111980, "total_steps": 119360, "loss": 0.4055, "lr": 1.1603275043825635e-07, "epoch": 18.763404825737265, "percentage": 93.82, "elapsed_time": "4:25:08", "remaining_time": "0:17:28", "throughput": 4080.34, "total_tokens": 64914064} +{"current_steps": 111985, "total_steps": 119360, "loss": 0.3357, "lr": 1.1587620887479944e-07, "epoch": 18.764242627345844, "percentage": 93.82, "elapsed_time": "4:25:09", "remaining_time": "0:17:27", "throughput": 4080.35, "total_tokens": 64917040} +{"current_steps": 111990, "total_steps": 119360, "loss": 0.0484, "lr": 1.1571977174098137e-07, "epoch": 18.765080428954423, "percentage": 93.83, "elapsed_time": "4:25:10", "remaining_time": "0:17:27", "throughput": 4080.37, "total_tokens": 64920176} +{"current_steps": 111995, "total_steps": 119360, "loss": 0.7239, "lr": 1.1556343904014778e-07, "epoch": 18.765918230563003, "percentage": 93.83, "elapsed_time": "4:25:11", "remaining_time": "0:17:26", "throughput": 4080.37, "total_tokens": 64922896} +{"current_steps": 112000, "total_steps": 119360, "loss": 0.3535, "lr": 1.1540721077563988e-07, "epoch": 18.766756032171582, "percentage": 93.83, "elapsed_time": "4:25:11", "remaining_time": "0:17:25", "throughput": 4080.38, "total_tokens": 64925712} +{"current_steps": 112005, "total_steps": 119360, "loss": 0.523, "lr": 1.1525108695079944e-07, "epoch": 18.76759383378016, "percentage": 93.84, "elapsed_time": "4:25:12", "remaining_time": "0:17:24", "throughput": 4080.38, "total_tokens": 64928464} +{"current_steps": 112010, "total_steps": 119360, "loss": 0.4471, "lr": 1.1509506756896438e-07, "epoch": 18.76843163538874, "percentage": 93.84, "elapsed_time": "4:25:13", "remaining_time": "0:17:24", "throughput": 4080.39, "total_tokens": 64931376} +{"current_steps": 112015, "total_steps": 119360, "loss": 0.5292, "lr": 1.1493915263347033e-07, "epoch": 18.76926943699732, "percentage": 93.85, "elapsed_time": "4:25:13", "remaining_time": "0:17:23", "throughput": 4080.4, "total_tokens": 64934352} +{"current_steps": 112020, "total_steps": 119360, "loss": 0.3341, "lr": 1.1478334214765019e-07, "epoch": 18.7701072386059, "percentage": 93.85, "elapsed_time": "4:25:14", "remaining_time": "0:17:22", "throughput": 4080.41, "total_tokens": 64937168} +{"current_steps": 112025, "total_steps": 119360, "loss": 0.3023, "lr": 1.146276361148363e-07, "epoch": 18.770945040214478, "percentage": 93.85, "elapsed_time": "4:25:14", "remaining_time": "0:17:22", "throughput": 4080.42, "total_tokens": 64939760} +{"current_steps": 112030, "total_steps": 119360, "loss": 0.359, "lr": 1.1447203453835876e-07, "epoch": 18.771782841823057, "percentage": 93.86, "elapsed_time": "4:25:15", "remaining_time": "0:17:21", "throughput": 4080.42, "total_tokens": 64942480} +{"current_steps": 112035, "total_steps": 119360, "loss": 0.2922, "lr": 1.1431653742154325e-07, "epoch": 18.772620643431637, "percentage": 93.86, "elapsed_time": "4:25:16", "remaining_time": "0:17:20", "throughput": 4080.43, "total_tokens": 64945488} +{"current_steps": 112040, "total_steps": 119360, "loss": 0.3299, "lr": 1.1416114476771434e-07, "epoch": 18.773458445040216, "percentage": 93.87, "elapsed_time": "4:25:16", "remaining_time": "0:17:19", "throughput": 4080.44, "total_tokens": 64948240} +{"current_steps": 112045, "total_steps": 119360, "loss": 0.2418, "lr": 1.1400585658019547e-07, "epoch": 18.774296246648795, "percentage": 93.87, "elapsed_time": "4:25:17", "remaining_time": "0:17:19", "throughput": 4080.45, "total_tokens": 64951344} +{"current_steps": 112050, "total_steps": 119360, "loss": 0.2952, "lr": 1.1385067286230623e-07, "epoch": 18.77513404825737, "percentage": 93.88, "elapsed_time": "4:25:18", "remaining_time": "0:17:18", "throughput": 4080.46, "total_tokens": 64954512} +{"current_steps": 112055, "total_steps": 119360, "loss": 0.3653, "lr": 1.1369559361736504e-07, "epoch": 18.77597184986595, "percentage": 93.88, "elapsed_time": "4:25:19", "remaining_time": "0:17:17", "throughput": 4080.47, "total_tokens": 64957136} +{"current_steps": 112060, "total_steps": 119360, "loss": 0.2364, "lr": 1.1354061884868817e-07, "epoch": 18.77680965147453, "percentage": 93.88, "elapsed_time": "4:25:19", "remaining_time": "0:17:17", "throughput": 4080.48, "total_tokens": 64960048} +{"current_steps": 112065, "total_steps": 119360, "loss": 0.2069, "lr": 1.133857485595874e-07, "epoch": 18.77764745308311, "percentage": 93.89, "elapsed_time": "4:25:20", "remaining_time": "0:17:16", "throughput": 4080.49, "total_tokens": 64962992} +{"current_steps": 112070, "total_steps": 119360, "loss": 0.2837, "lr": 1.1323098275337619e-07, "epoch": 18.778485254691688, "percentage": 93.89, "elapsed_time": "4:25:21", "remaining_time": "0:17:15", "throughput": 4080.5, "total_tokens": 64965936} +{"current_steps": 112075, "total_steps": 119360, "loss": 0.503, "lr": 1.13076321433363e-07, "epoch": 18.779323056300267, "percentage": 93.9, "elapsed_time": "4:25:21", "remaining_time": "0:17:14", "throughput": 4080.5, "total_tokens": 64968784} +{"current_steps": 112080, "total_steps": 119360, "loss": 0.3806, "lr": 1.1292176460285409e-07, "epoch": 18.780160857908847, "percentage": 93.9, "elapsed_time": "4:25:22", "remaining_time": "0:17:14", "throughput": 4080.52, "total_tokens": 64971824} +{"current_steps": 112085, "total_steps": 119360, "loss": 0.369, "lr": 1.1276731226515514e-07, "epoch": 18.780998659517426, "percentage": 93.9, "elapsed_time": "4:25:23", "remaining_time": "0:17:13", "throughput": 4080.53, "total_tokens": 64974640} +{"current_steps": 112090, "total_steps": 119360, "loss": 0.2958, "lr": 1.126129644235674e-07, "epoch": 18.781836461126005, "percentage": 93.91, "elapsed_time": "4:25:23", "remaining_time": "0:17:12", "throughput": 4080.54, "total_tokens": 64977424} +{"current_steps": 112095, "total_steps": 119360, "loss": 0.4985, "lr": 1.1245872108139155e-07, "epoch": 18.782674262734584, "percentage": 93.91, "elapsed_time": "4:25:24", "remaining_time": "0:17:12", "throughput": 4080.55, "total_tokens": 64980336} +{"current_steps": 112100, "total_steps": 119360, "loss": 0.2965, "lr": 1.1230458224192609e-07, "epoch": 18.783512064343164, "percentage": 93.92, "elapsed_time": "4:25:25", "remaining_time": "0:17:11", "throughput": 4080.55, "total_tokens": 64983120} +{"current_steps": 112105, "total_steps": 119360, "loss": 0.2385, "lr": 1.1215054790846614e-07, "epoch": 18.784349865951743, "percentage": 93.92, "elapsed_time": "4:25:25", "remaining_time": "0:17:10", "throughput": 4080.56, "total_tokens": 64986000} +{"current_steps": 112110, "total_steps": 119360, "loss": 0.2832, "lr": 1.1199661808430517e-07, "epoch": 18.785187667560322, "percentage": 93.93, "elapsed_time": "4:25:26", "remaining_time": "0:17:09", "throughput": 4080.58, "total_tokens": 64989136} +{"current_steps": 112115, "total_steps": 119360, "loss": 0.7917, "lr": 1.1184279277273446e-07, "epoch": 18.7860254691689, "percentage": 93.93, "elapsed_time": "4:25:27", "remaining_time": "0:17:09", "throughput": 4080.59, "total_tokens": 64992144} +{"current_steps": 112120, "total_steps": 119360, "loss": 0.1803, "lr": 1.1168907197704359e-07, "epoch": 18.78686327077748, "percentage": 93.93, "elapsed_time": "4:25:27", "remaining_time": "0:17:08", "throughput": 4080.6, "total_tokens": 64995088} +{"current_steps": 112125, "total_steps": 119360, "loss": 0.1426, "lr": 1.1153545570051827e-07, "epoch": 18.78770107238606, "percentage": 93.94, "elapsed_time": "4:25:28", "remaining_time": "0:17:07", "throughput": 4080.6, "total_tokens": 64997776} +{"current_steps": 112130, "total_steps": 119360, "loss": 0.3266, "lr": 1.1138194394644364e-07, "epoch": 18.78853887399464, "percentage": 93.94, "elapsed_time": "4:25:29", "remaining_time": "0:17:07", "throughput": 4080.61, "total_tokens": 65001040} +{"current_steps": 112135, "total_steps": 119360, "loss": 0.2769, "lr": 1.1122853671810263e-07, "epoch": 18.78937667560322, "percentage": 93.95, "elapsed_time": "4:25:29", "remaining_time": "0:17:06", "throughput": 4080.63, "total_tokens": 65004144} +{"current_steps": 112140, "total_steps": 119360, "loss": 0.1369, "lr": 1.1107523401877374e-07, "epoch": 18.790214477211798, "percentage": 93.95, "elapsed_time": "4:25:30", "remaining_time": "0:17:05", "throughput": 4080.64, "total_tokens": 65007152} +{"current_steps": 112145, "total_steps": 119360, "loss": 0.473, "lr": 1.1092203585173655e-07, "epoch": 18.791052278820374, "percentage": 93.96, "elapsed_time": "4:25:31", "remaining_time": "0:17:04", "throughput": 4080.65, "total_tokens": 65009968} +{"current_steps": 112150, "total_steps": 119360, "loss": 0.1803, "lr": 1.1076894222026513e-07, "epoch": 18.791890080428953, "percentage": 93.96, "elapsed_time": "4:25:31", "remaining_time": "0:17:04", "throughput": 4080.66, "total_tokens": 65012880} +{"current_steps": 112155, "total_steps": 119360, "loss": 0.2555, "lr": 1.1061595312763407e-07, "epoch": 18.792727882037532, "percentage": 93.96, "elapsed_time": "4:25:32", "remaining_time": "0:17:03", "throughput": 4080.66, "total_tokens": 65015728} +{"current_steps": 112160, "total_steps": 119360, "loss": 0.314, "lr": 1.1046306857711353e-07, "epoch": 18.79356568364611, "percentage": 93.97, "elapsed_time": "4:25:33", "remaining_time": "0:17:02", "throughput": 4080.68, "total_tokens": 65018608} +{"current_steps": 112165, "total_steps": 119360, "loss": 0.2796, "lr": 1.1031028857197312e-07, "epoch": 18.79440348525469, "percentage": 93.97, "elapsed_time": "4:25:33", "remaining_time": "0:17:02", "throughput": 4080.69, "total_tokens": 65021520} +{"current_steps": 112170, "total_steps": 119360, "loss": 0.2223, "lr": 1.1015761311547912e-07, "epoch": 18.79524128686327, "percentage": 93.98, "elapsed_time": "4:25:34", "remaining_time": "0:17:01", "throughput": 4080.69, "total_tokens": 65024272} +{"current_steps": 112175, "total_steps": 119360, "loss": 0.5133, "lr": 1.1000504221089613e-07, "epoch": 18.79607908847185, "percentage": 93.98, "elapsed_time": "4:25:35", "remaining_time": "0:17:00", "throughput": 4080.7, "total_tokens": 65026960} +{"current_steps": 112180, "total_steps": 119360, "loss": 0.2851, "lr": 1.0985257586148656e-07, "epoch": 18.79691689008043, "percentage": 93.98, "elapsed_time": "4:25:35", "remaining_time": "0:16:59", "throughput": 4080.7, "total_tokens": 65029840} +{"current_steps": 112185, "total_steps": 119360, "loss": 0.4068, "lr": 1.0970021407050946e-07, "epoch": 18.797754691689008, "percentage": 93.99, "elapsed_time": "4:25:36", "remaining_time": "0:16:59", "throughput": 4080.71, "total_tokens": 65032624} +{"current_steps": 112190, "total_steps": 119360, "loss": 0.2412, "lr": 1.0954795684122388e-07, "epoch": 18.798592493297587, "percentage": 93.99, "elapsed_time": "4:25:37", "remaining_time": "0:16:58", "throughput": 4080.72, "total_tokens": 65035376} +{"current_steps": 112195, "total_steps": 119360, "loss": 0.2535, "lr": 1.0939580417688389e-07, "epoch": 18.799430294906166, "percentage": 94.0, "elapsed_time": "4:25:37", "remaining_time": "0:16:57", "throughput": 4080.73, "total_tokens": 65038160} +{"current_steps": 112200, "total_steps": 119360, "loss": 0.2242, "lr": 1.0924375608074356e-07, "epoch": 18.800268096514746, "percentage": 94.0, "elapsed_time": "4:25:38", "remaining_time": "0:16:57", "throughput": 4080.73, "total_tokens": 65041104} +{"current_steps": 112205, "total_steps": 119360, "loss": 0.2822, "lr": 1.0909181255605417e-07, "epoch": 18.801105898123325, "percentage": 94.01, "elapsed_time": "4:25:39", "remaining_time": "0:16:56", "throughput": 4080.74, "total_tokens": 65044048} +{"current_steps": 112210, "total_steps": 119360, "loss": 0.1422, "lr": 1.0893997360606367e-07, "epoch": 18.801943699731904, "percentage": 94.01, "elapsed_time": "4:25:40", "remaining_time": "0:16:55", "throughput": 4080.76, "total_tokens": 65047408} +{"current_steps": 112215, "total_steps": 119360, "loss": 0.3714, "lr": 1.0878823923401894e-07, "epoch": 18.802781501340483, "percentage": 94.01, "elapsed_time": "4:25:40", "remaining_time": "0:16:54", "throughput": 4080.76, "total_tokens": 65050192} +{"current_steps": 112220, "total_steps": 119360, "loss": 0.303, "lr": 1.0863660944316456e-07, "epoch": 18.803619302949063, "percentage": 94.02, "elapsed_time": "4:25:41", "remaining_time": "0:16:54", "throughput": 4080.77, "total_tokens": 65053104} +{"current_steps": 112225, "total_steps": 119360, "loss": 0.2293, "lr": 1.0848508423674187e-07, "epoch": 18.804457104557642, "percentage": 94.02, "elapsed_time": "4:25:42", "remaining_time": "0:16:53", "throughput": 4080.78, "total_tokens": 65055856} +{"current_steps": 112230, "total_steps": 119360, "loss": 0.3613, "lr": 1.0833366361799158e-07, "epoch": 18.80529490616622, "percentage": 94.03, "elapsed_time": "4:25:42", "remaining_time": "0:16:52", "throughput": 4080.78, "total_tokens": 65058512} +{"current_steps": 112235, "total_steps": 119360, "loss": 0.2746, "lr": 1.0818234759015167e-07, "epoch": 18.8061327077748, "percentage": 94.03, "elapsed_time": "4:25:43", "remaining_time": "0:16:52", "throughput": 4080.79, "total_tokens": 65061264} +{"current_steps": 112240, "total_steps": 119360, "loss": 0.3469, "lr": 1.0803113615645567e-07, "epoch": 18.80697050938338, "percentage": 94.03, "elapsed_time": "4:25:43", "remaining_time": "0:16:51", "throughput": 4080.79, "total_tokens": 65064080} +{"current_steps": 112245, "total_steps": 119360, "loss": 0.3105, "lr": 1.0788002932013819e-07, "epoch": 18.80780831099196, "percentage": 94.04, "elapsed_time": "4:25:44", "remaining_time": "0:16:50", "throughput": 4080.8, "total_tokens": 65067024} +{"current_steps": 112250, "total_steps": 119360, "loss": 0.4298, "lr": 1.0772902708442945e-07, "epoch": 18.808646112600535, "percentage": 94.04, "elapsed_time": "4:25:45", "remaining_time": "0:16:49", "throughput": 4080.81, "total_tokens": 65070000} +{"current_steps": 112255, "total_steps": 119360, "loss": 0.2079, "lr": 1.0757812945255852e-07, "epoch": 18.809483914209114, "percentage": 94.05, "elapsed_time": "4:25:46", "remaining_time": "0:16:49", "throughput": 4080.82, "total_tokens": 65072848} +{"current_steps": 112260, "total_steps": 119360, "loss": 0.3784, "lr": 1.0742733642775172e-07, "epoch": 18.810321715817693, "percentage": 94.05, "elapsed_time": "4:25:46", "remaining_time": "0:16:48", "throughput": 4080.83, "total_tokens": 65075696} +{"current_steps": 112265, "total_steps": 119360, "loss": 0.1277, "lr": 1.0727664801323312e-07, "epoch": 18.811159517426272, "percentage": 94.06, "elapsed_time": "4:25:47", "remaining_time": "0:16:47", "throughput": 4080.84, "total_tokens": 65078608} +{"current_steps": 112270, "total_steps": 119360, "loss": 0.4501, "lr": 1.0712606421222405e-07, "epoch": 18.81199731903485, "percentage": 94.06, "elapsed_time": "4:25:48", "remaining_time": "0:16:47", "throughput": 4080.85, "total_tokens": 65081424} +{"current_steps": 112275, "total_steps": 119360, "loss": 0.2893, "lr": 1.0697558502794525e-07, "epoch": 18.81283512064343, "percentage": 94.06, "elapsed_time": "4:25:48", "remaining_time": "0:16:46", "throughput": 4080.85, "total_tokens": 65084464} +{"current_steps": 112280, "total_steps": 119360, "loss": 0.3934, "lr": 1.0682521046361417e-07, "epoch": 18.81367292225201, "percentage": 94.07, "elapsed_time": "4:25:49", "remaining_time": "0:16:45", "throughput": 4080.86, "total_tokens": 65087472} +{"current_steps": 112285, "total_steps": 119360, "loss": 0.4522, "lr": 1.0667494052244542e-07, "epoch": 18.81451072386059, "percentage": 94.07, "elapsed_time": "4:25:50", "remaining_time": "0:16:45", "throughput": 4080.87, "total_tokens": 65090192} +{"current_steps": 112290, "total_steps": 119360, "loss": 0.2646, "lr": 1.0652477520765148e-07, "epoch": 18.81534852546917, "percentage": 94.08, "elapsed_time": "4:25:50", "remaining_time": "0:16:44", "throughput": 4080.88, "total_tokens": 65093072} +{"current_steps": 112295, "total_steps": 119360, "loss": 0.435, "lr": 1.0637471452244474e-07, "epoch": 18.816186327077748, "percentage": 94.08, "elapsed_time": "4:25:51", "remaining_time": "0:16:43", "throughput": 4080.89, "total_tokens": 65096016} +{"current_steps": 112300, "total_steps": 119360, "loss": 0.517, "lr": 1.0622475847003266e-07, "epoch": 18.817024128686327, "percentage": 94.09, "elapsed_time": "4:25:52", "remaining_time": "0:16:42", "throughput": 4080.9, "total_tokens": 65098832} +{"current_steps": 112305, "total_steps": 119360, "loss": 0.2262, "lr": 1.06074907053621e-07, "epoch": 18.817861930294907, "percentage": 94.09, "elapsed_time": "4:25:52", "remaining_time": "0:16:42", "throughput": 4080.91, "total_tokens": 65101584} +{"current_steps": 112310, "total_steps": 119360, "loss": 0.3763, "lr": 1.0592516027641498e-07, "epoch": 18.818699731903486, "percentage": 94.09, "elapsed_time": "4:25:53", "remaining_time": "0:16:41", "throughput": 4080.91, "total_tokens": 65104368} +{"current_steps": 112315, "total_steps": 119360, "loss": 0.2285, "lr": 1.0577551814161591e-07, "epoch": 18.819537533512065, "percentage": 94.1, "elapsed_time": "4:25:54", "remaining_time": "0:16:40", "throughput": 4080.92, "total_tokens": 65107248} +{"current_steps": 112320, "total_steps": 119360, "loss": 0.5282, "lr": 1.0562598065242291e-07, "epoch": 18.820375335120644, "percentage": 94.1, "elapsed_time": "4:25:54", "remaining_time": "0:16:40", "throughput": 4080.93, "total_tokens": 65110224} +{"current_steps": 112325, "total_steps": 119360, "loss": 0.1962, "lr": 1.0547654781203398e-07, "epoch": 18.821213136729224, "percentage": 94.11, "elapsed_time": "4:25:55", "remaining_time": "0:16:39", "throughput": 4080.94, "total_tokens": 65113200} +{"current_steps": 112330, "total_steps": 119360, "loss": 0.2576, "lr": 1.0532721962364378e-07, "epoch": 18.822050938337803, "percentage": 94.11, "elapsed_time": "4:25:56", "remaining_time": "0:16:38", "throughput": 4080.96, "total_tokens": 65116080} +{"current_steps": 112335, "total_steps": 119360, "loss": 0.316, "lr": 1.0517799609044532e-07, "epoch": 18.822888739946382, "percentage": 94.11, "elapsed_time": "4:25:56", "remaining_time": "0:16:37", "throughput": 4080.97, "total_tokens": 65118928} +{"current_steps": 112340, "total_steps": 119360, "loss": 0.4285, "lr": 1.0502887721562937e-07, "epoch": 18.82372654155496, "percentage": 94.12, "elapsed_time": "4:25:57", "remaining_time": "0:16:37", "throughput": 4080.98, "total_tokens": 65122096} +{"current_steps": 112345, "total_steps": 119360, "loss": 0.4853, "lr": 1.048798630023845e-07, "epoch": 18.824564343163537, "percentage": 94.12, "elapsed_time": "4:25:58", "remaining_time": "0:16:36", "throughput": 4081.0, "total_tokens": 65125296} +{"current_steps": 112350, "total_steps": 119360, "loss": 0.3192, "lr": 1.0473095345389539e-07, "epoch": 18.825402144772116, "percentage": 94.13, "elapsed_time": "4:25:58", "remaining_time": "0:16:35", "throughput": 4081.01, "total_tokens": 65128496} +{"current_steps": 112355, "total_steps": 119360, "loss": 0.5667, "lr": 1.0458214857334837e-07, "epoch": 18.826239946380696, "percentage": 94.13, "elapsed_time": "4:25:59", "remaining_time": "0:16:35", "throughput": 4081.02, "total_tokens": 65131472} +{"current_steps": 112360, "total_steps": 119360, "loss": 0.5313, "lr": 1.044334483639231e-07, "epoch": 18.827077747989275, "percentage": 94.14, "elapsed_time": "4:26:00", "remaining_time": "0:16:34", "throughput": 4081.02, "total_tokens": 65134352} +{"current_steps": 112365, "total_steps": 119360, "loss": 0.3532, "lr": 1.0428485282879985e-07, "epoch": 18.827915549597854, "percentage": 94.14, "elapsed_time": "4:26:01", "remaining_time": "0:16:33", "throughput": 4081.04, "total_tokens": 65137552} +{"current_steps": 112370, "total_steps": 119360, "loss": 0.2547, "lr": 1.0413636197115551e-07, "epoch": 18.828753351206434, "percentage": 94.14, "elapsed_time": "4:26:01", "remaining_time": "0:16:32", "throughput": 4081.05, "total_tokens": 65140400} +{"current_steps": 112375, "total_steps": 119360, "loss": 0.1572, "lr": 1.0398797579416476e-07, "epoch": 18.829591152815013, "percentage": 94.15, "elapsed_time": "4:26:02", "remaining_time": "0:16:32", "throughput": 4081.06, "total_tokens": 65143344} +{"current_steps": 112380, "total_steps": 119360, "loss": 0.2635, "lr": 1.0383969430100116e-07, "epoch": 18.830428954423592, "percentage": 94.15, "elapsed_time": "4:26:03", "remaining_time": "0:16:31", "throughput": 4081.06, "total_tokens": 65146032} +{"current_steps": 112385, "total_steps": 119360, "loss": 0.4671, "lr": 1.0369151749483497e-07, "epoch": 18.83126675603217, "percentage": 94.16, "elapsed_time": "4:26:03", "remaining_time": "0:16:30", "throughput": 4081.07, "total_tokens": 65148816} +{"current_steps": 112390, "total_steps": 119360, "loss": 0.3337, "lr": 1.035434453788342e-07, "epoch": 18.83210455764075, "percentage": 94.16, "elapsed_time": "4:26:04", "remaining_time": "0:16:30", "throughput": 4081.08, "total_tokens": 65151568} +{"current_steps": 112395, "total_steps": 119360, "loss": 0.4212, "lr": 1.0339547795616468e-07, "epoch": 18.83294235924933, "percentage": 94.16, "elapsed_time": "4:26:04", "remaining_time": "0:16:29", "throughput": 4081.08, "total_tokens": 65154416} +{"current_steps": 112400, "total_steps": 119360, "loss": 0.4148, "lr": 1.032476152299905e-07, "epoch": 18.83378016085791, "percentage": 94.17, "elapsed_time": "4:26:05", "remaining_time": "0:16:28", "throughput": 4081.1, "total_tokens": 65157456} +{"current_steps": 112405, "total_steps": 119360, "loss": 0.2004, "lr": 1.0309985720347304e-07, "epoch": 18.83461796246649, "percentage": 94.17, "elapsed_time": "4:26:06", "remaining_time": "0:16:27", "throughput": 4081.12, "total_tokens": 65160656} +{"current_steps": 112410, "total_steps": 119360, "loss": 0.7227, "lr": 1.0295220387977089e-07, "epoch": 18.835455764075068, "percentage": 94.18, "elapsed_time": "4:26:07", "remaining_time": "0:16:27", "throughput": 4081.12, "total_tokens": 65163536} +{"current_steps": 112415, "total_steps": 119360, "loss": 0.6987, "lr": 1.0280465526204264e-07, "epoch": 18.836293565683647, "percentage": 94.18, "elapsed_time": "4:26:07", "remaining_time": "0:16:26", "throughput": 4081.14, "total_tokens": 65166736} +{"current_steps": 112420, "total_steps": 119360, "loss": 0.394, "lr": 1.0265721135344131e-07, "epoch": 18.837131367292226, "percentage": 94.19, "elapsed_time": "4:26:08", "remaining_time": "0:16:25", "throughput": 4081.14, "total_tokens": 65169424} +{"current_steps": 112425, "total_steps": 119360, "loss": 0.257, "lr": 1.0250987215712105e-07, "epoch": 18.837969168900806, "percentage": 94.19, "elapsed_time": "4:26:09", "remaining_time": "0:16:25", "throughput": 4081.15, "total_tokens": 65172144} +{"current_steps": 112430, "total_steps": 119360, "loss": 0.341, "lr": 1.02362637676231e-07, "epoch": 18.838806970509385, "percentage": 94.19, "elapsed_time": "4:26:09", "remaining_time": "0:16:24", "throughput": 4081.16, "total_tokens": 65175120} +{"current_steps": 112435, "total_steps": 119360, "loss": 0.3802, "lr": 1.0221550791392033e-07, "epoch": 18.839644772117964, "percentage": 94.2, "elapsed_time": "4:26:10", "remaining_time": "0:16:23", "throughput": 4081.17, "total_tokens": 65178032} +{"current_steps": 112440, "total_steps": 119360, "loss": 0.3618, "lr": 1.020684828733337e-07, "epoch": 18.84048257372654, "percentage": 94.2, "elapsed_time": "4:26:11", "remaining_time": "0:16:22", "throughput": 4081.17, "total_tokens": 65180784} +{"current_steps": 112445, "total_steps": 119360, "loss": 0.1458, "lr": 1.0192156255761643e-07, "epoch": 18.84132037533512, "percentage": 94.21, "elapsed_time": "4:26:11", "remaining_time": "0:16:22", "throughput": 4081.18, "total_tokens": 65183760} +{"current_steps": 112450, "total_steps": 119360, "loss": 0.2639, "lr": 1.0177474696990764e-07, "epoch": 18.8421581769437, "percentage": 94.21, "elapsed_time": "4:26:12", "remaining_time": "0:16:21", "throughput": 4081.19, "total_tokens": 65186448} +{"current_steps": 112455, "total_steps": 119360, "loss": 0.252, "lr": 1.0162803611334759e-07, "epoch": 18.842995978552278, "percentage": 94.21, "elapsed_time": "4:26:13", "remaining_time": "0:16:20", "throughput": 4081.21, "total_tokens": 65189488} +{"current_steps": 112460, "total_steps": 119360, "loss": 0.2771, "lr": 1.014814299910738e-07, "epoch": 18.843833780160857, "percentage": 94.22, "elapsed_time": "4:26:13", "remaining_time": "0:16:20", "throughput": 4081.21, "total_tokens": 65192144} +{"current_steps": 112465, "total_steps": 119360, "loss": 0.1429, "lr": 1.0133492860622041e-07, "epoch": 18.844671581769436, "percentage": 94.22, "elapsed_time": "4:26:14", "remaining_time": "0:16:19", "throughput": 4081.22, "total_tokens": 65195024} +{"current_steps": 112470, "total_steps": 119360, "loss": 0.2878, "lr": 1.0118853196191936e-07, "epoch": 18.845509383378015, "percentage": 94.23, "elapsed_time": "4:26:15", "remaining_time": "0:16:18", "throughput": 4081.22, "total_tokens": 65197744} +{"current_steps": 112475, "total_steps": 119360, "loss": 0.2938, "lr": 1.0104224006130092e-07, "epoch": 18.846347184986595, "percentage": 94.23, "elapsed_time": "4:26:15", "remaining_time": "0:16:17", "throughput": 4081.23, "total_tokens": 65200464} +{"current_steps": 112480, "total_steps": 119360, "loss": 0.494, "lr": 1.0089605290749372e-07, "epoch": 18.847184986595174, "percentage": 94.24, "elapsed_time": "4:26:16", "remaining_time": "0:16:17", "throughput": 4081.24, "total_tokens": 65203440} +{"current_steps": 112485, "total_steps": 119360, "loss": 0.3974, "lr": 1.0074997050362245e-07, "epoch": 18.848022788203753, "percentage": 94.24, "elapsed_time": "4:26:17", "remaining_time": "0:16:16", "throughput": 4081.25, "total_tokens": 65206416} +{"current_steps": 112490, "total_steps": 119360, "loss": 0.2947, "lr": 1.0060399285281241e-07, "epoch": 18.848860589812332, "percentage": 94.24, "elapsed_time": "4:26:17", "remaining_time": "0:16:15", "throughput": 4081.26, "total_tokens": 65209456} +{"current_steps": 112495, "total_steps": 119360, "loss": 0.1942, "lr": 1.0045811995818222e-07, "epoch": 18.84969839142091, "percentage": 94.25, "elapsed_time": "4:26:18", "remaining_time": "0:16:15", "throughput": 4081.27, "total_tokens": 65212176} +{"current_steps": 112500, "total_steps": 119360, "loss": 0.1628, "lr": 1.0031235182285215e-07, "epoch": 18.85053619302949, "percentage": 94.25, "elapsed_time": "4:26:19", "remaining_time": "0:16:14", "throughput": 4081.28, "total_tokens": 65215344} +{"current_steps": 112505, "total_steps": 119360, "loss": 0.4947, "lr": 1.0016668844994027e-07, "epoch": 18.85137399463807, "percentage": 94.26, "elapsed_time": "4:26:19", "remaining_time": "0:16:13", "throughput": 4081.29, "total_tokens": 65218128} +{"current_steps": 112510, "total_steps": 119360, "loss": 0.2705, "lr": 1.0002112984255852e-07, "epoch": 18.85221179624665, "percentage": 94.26, "elapsed_time": "4:26:20", "remaining_time": "0:16:12", "throughput": 4081.3, "total_tokens": 65221136} +{"current_steps": 112515, "total_steps": 119360, "loss": 0.4221, "lr": 9.987567600382053e-08, "epoch": 18.85304959785523, "percentage": 94.27, "elapsed_time": "4:26:21", "remaining_time": "0:16:12", "throughput": 4081.31, "total_tokens": 65224304} +{"current_steps": 112520, "total_steps": 119360, "loss": 0.1799, "lr": 9.973032693683715e-08, "epoch": 18.853887399463808, "percentage": 94.27, "elapsed_time": "4:26:21", "remaining_time": "0:16:11", "throughput": 4081.33, "total_tokens": 65227280} +{"current_steps": 112525, "total_steps": 119360, "loss": 0.4132, "lr": 9.958508264471423e-08, "epoch": 18.854725201072387, "percentage": 94.27, "elapsed_time": "4:26:22", "remaining_time": "0:16:10", "throughput": 4081.33, "total_tokens": 65230096} +{"current_steps": 112530, "total_steps": 119360, "loss": 0.5125, "lr": 9.943994313055871e-08, "epoch": 18.855563002680967, "percentage": 94.28, "elapsed_time": "4:26:23", "remaining_time": "0:16:10", "throughput": 4081.34, "total_tokens": 65233008} +{"current_steps": 112535, "total_steps": 119360, "loss": 0.3538, "lr": 9.929490839747314e-08, "epoch": 18.856400804289546, "percentage": 94.28, "elapsed_time": "4:26:23", "remaining_time": "0:16:09", "throughput": 4081.36, "total_tokens": 65236240} +{"current_steps": 112540, "total_steps": 119360, "loss": 0.2264, "lr": 9.91499784485589e-08, "epoch": 18.85723860589812, "percentage": 94.29, "elapsed_time": "4:26:24", "remaining_time": "0:16:08", "throughput": 4081.37, "total_tokens": 65239152} +{"current_steps": 112545, "total_steps": 119360, "loss": 0.1815, "lr": 9.900515328691463e-08, "epoch": 18.8580764075067, "percentage": 94.29, "elapsed_time": "4:26:25", "remaining_time": "0:16:07", "throughput": 4081.38, "total_tokens": 65242192} +{"current_steps": 112550, "total_steps": 119360, "loss": 0.3339, "lr": 9.886043291563784e-08, "epoch": 18.85891420911528, "percentage": 94.29, "elapsed_time": "4:26:26", "remaining_time": "0:16:07", "throughput": 4081.39, "total_tokens": 65245104} +{"current_steps": 112555, "total_steps": 119360, "loss": 0.3957, "lr": 9.871581733782054e-08, "epoch": 18.85975201072386, "percentage": 94.3, "elapsed_time": "4:26:26", "remaining_time": "0:16:06", "throughput": 4081.4, "total_tokens": 65248048} +{"current_steps": 112560, "total_steps": 119360, "loss": 0.2727, "lr": 9.857130655655744e-08, "epoch": 18.86058981233244, "percentage": 94.3, "elapsed_time": "4:26:27", "remaining_time": "0:16:05", "throughput": 4081.41, "total_tokens": 65250768} +{"current_steps": 112565, "total_steps": 119360, "loss": 0.2737, "lr": 9.842690057493775e-08, "epoch": 18.861427613941018, "percentage": 94.31, "elapsed_time": "4:26:27", "remaining_time": "0:16:05", "throughput": 4081.42, "total_tokens": 65253552} +{"current_steps": 112570, "total_steps": 119360, "loss": 0.384, "lr": 9.828259939604789e-08, "epoch": 18.862265415549597, "percentage": 94.31, "elapsed_time": "4:26:28", "remaining_time": "0:16:04", "throughput": 4081.42, "total_tokens": 65256304} +{"current_steps": 112575, "total_steps": 119360, "loss": 0.303, "lr": 9.813840302297317e-08, "epoch": 18.863103217158177, "percentage": 94.32, "elapsed_time": "4:26:29", "remaining_time": "0:16:03", "throughput": 4081.44, "total_tokens": 65259376} +{"current_steps": 112580, "total_steps": 119360, "loss": 0.1047, "lr": 9.799431145879889e-08, "epoch": 18.863941018766756, "percentage": 94.32, "elapsed_time": "4:26:29", "remaining_time": "0:16:02", "throughput": 4081.44, "total_tokens": 65262288} +{"current_steps": 112585, "total_steps": 119360, "loss": 0.1723, "lr": 9.785032470660372e-08, "epoch": 18.864778820375335, "percentage": 94.32, "elapsed_time": "4:26:30", "remaining_time": "0:16:02", "throughput": 4081.46, "total_tokens": 65265360} +{"current_steps": 112590, "total_steps": 119360, "loss": 0.4162, "lr": 9.770644276946739e-08, "epoch": 18.865616621983914, "percentage": 94.33, "elapsed_time": "4:26:31", "remaining_time": "0:16:01", "throughput": 4081.47, "total_tokens": 65268400} +{"current_steps": 112595, "total_steps": 119360, "loss": 0.2848, "lr": 9.756266565046691e-08, "epoch": 18.866454423592494, "percentage": 94.33, "elapsed_time": "4:26:32", "remaining_time": "0:16:00", "throughput": 4081.49, "total_tokens": 65271472} +{"current_steps": 112600, "total_steps": 119360, "loss": 0.3411, "lr": 9.741899335267425e-08, "epoch": 18.867292225201073, "percentage": 94.34, "elapsed_time": "4:26:32", "remaining_time": "0:16:00", "throughput": 4081.5, "total_tokens": 65274256} +{"current_steps": 112605, "total_steps": 119360, "loss": 0.3086, "lr": 9.727542587916306e-08, "epoch": 18.868130026809652, "percentage": 94.34, "elapsed_time": "4:26:33", "remaining_time": "0:15:59", "throughput": 4081.5, "total_tokens": 65276944} +{"current_steps": 112610, "total_steps": 119360, "loss": 0.2014, "lr": 9.713196323300312e-08, "epoch": 18.86896782841823, "percentage": 94.34, "elapsed_time": "4:26:34", "remaining_time": "0:15:58", "throughput": 4081.51, "total_tokens": 65279856} +{"current_steps": 112615, "total_steps": 119360, "loss": 0.4072, "lr": 9.698860541726085e-08, "epoch": 18.86980563002681, "percentage": 94.35, "elapsed_time": "4:26:34", "remaining_time": "0:15:57", "throughput": 4081.52, "total_tokens": 65282928} +{"current_steps": 112620, "total_steps": 119360, "loss": 0.2732, "lr": 9.684535243500159e-08, "epoch": 18.87064343163539, "percentage": 94.35, "elapsed_time": "4:26:35", "remaining_time": "0:15:57", "throughput": 4081.54, "total_tokens": 65285872} +{"current_steps": 112625, "total_steps": 119360, "loss": 0.3905, "lr": 9.670220428928956e-08, "epoch": 18.87148123324397, "percentage": 94.36, "elapsed_time": "4:26:36", "remaining_time": "0:15:56", "throughput": 4081.55, "total_tokens": 65288912} +{"current_steps": 112630, "total_steps": 119360, "loss": 0.3711, "lr": 9.655916098318396e-08, "epoch": 18.87231903485255, "percentage": 94.36, "elapsed_time": "4:26:36", "remaining_time": "0:15:55", "throughput": 4081.56, "total_tokens": 65291664} +{"current_steps": 112635, "total_steps": 119360, "loss": 0.3435, "lr": 9.641622251974458e-08, "epoch": 18.873156836461128, "percentage": 94.37, "elapsed_time": "4:26:37", "remaining_time": "0:15:55", "throughput": 4081.57, "total_tokens": 65294672} +{"current_steps": 112640, "total_steps": 119360, "loss": 0.2203, "lr": 9.62733889020262e-08, "epoch": 18.873994638069703, "percentage": 94.37, "elapsed_time": "4:26:38", "remaining_time": "0:15:54", "throughput": 4081.58, "total_tokens": 65297648} +{"current_steps": 112645, "total_steps": 119360, "loss": 0.4533, "lr": 9.613066013308414e-08, "epoch": 18.874832439678283, "percentage": 94.37, "elapsed_time": "4:26:38", "remaining_time": "0:15:53", "throughput": 4081.59, "total_tokens": 65300304} +{"current_steps": 112650, "total_steps": 119360, "loss": 0.5106, "lr": 9.59880362159693e-08, "epoch": 18.875670241286862, "percentage": 94.38, "elapsed_time": "4:26:39", "remaining_time": "0:15:53", "throughput": 4081.6, "total_tokens": 65303280} +{"current_steps": 112655, "total_steps": 119360, "loss": 0.2268, "lr": 9.584551715373147e-08, "epoch": 18.87650804289544, "percentage": 94.38, "elapsed_time": "4:26:40", "remaining_time": "0:15:52", "throughput": 4081.61, "total_tokens": 65306128} +{"current_steps": 112660, "total_steps": 119360, "loss": 0.1518, "lr": 9.570310294941765e-08, "epoch": 18.87734584450402, "percentage": 94.39, "elapsed_time": "4:26:40", "remaining_time": "0:15:51", "throughput": 4081.61, "total_tokens": 65308880} +{"current_steps": 112665, "total_steps": 119360, "loss": 0.4189, "lr": 9.556079360607318e-08, "epoch": 18.8781836461126, "percentage": 94.39, "elapsed_time": "4:26:41", "remaining_time": "0:15:50", "throughput": 4081.61, "total_tokens": 65311632} +{"current_steps": 112670, "total_steps": 119360, "loss": 0.5196, "lr": 9.541858912674173e-08, "epoch": 18.87902144772118, "percentage": 94.4, "elapsed_time": "4:26:42", "remaining_time": "0:15:50", "throughput": 4081.62, "total_tokens": 65314480} +{"current_steps": 112675, "total_steps": 119360, "loss": 0.2814, "lr": 9.5276489514462e-08, "epoch": 18.87985924932976, "percentage": 94.4, "elapsed_time": "4:26:42", "remaining_time": "0:15:49", "throughput": 4081.62, "total_tokens": 65316976} +{"current_steps": 112680, "total_steps": 119360, "loss": 0.346, "lr": 9.513449477227266e-08, "epoch": 18.880697050938338, "percentage": 94.4, "elapsed_time": "4:26:43", "remaining_time": "0:15:48", "throughput": 4081.63, "total_tokens": 65319984} +{"current_steps": 112685, "total_steps": 119360, "loss": 0.4887, "lr": 9.499260490321183e-08, "epoch": 18.881534852546917, "percentage": 94.41, "elapsed_time": "4:26:44", "remaining_time": "0:15:48", "throughput": 4081.65, "total_tokens": 65323440} +{"current_steps": 112690, "total_steps": 119360, "loss": 0.4568, "lr": 9.485081991031042e-08, "epoch": 18.882372654155496, "percentage": 94.41, "elapsed_time": "4:26:44", "remaining_time": "0:15:47", "throughput": 4081.66, "total_tokens": 65326384} +{"current_steps": 112695, "total_steps": 119360, "loss": 0.2574, "lr": 9.470913979660212e-08, "epoch": 18.883210455764075, "percentage": 94.42, "elapsed_time": "4:26:45", "remaining_time": "0:15:46", "throughput": 4081.67, "total_tokens": 65329200} +{"current_steps": 112700, "total_steps": 119360, "loss": 0.1456, "lr": 9.456756456511506e-08, "epoch": 18.884048257372655, "percentage": 94.42, "elapsed_time": "4:26:46", "remaining_time": "0:15:45", "throughput": 4081.68, "total_tokens": 65332400} +{"current_steps": 112705, "total_steps": 119360, "loss": 0.4375, "lr": 9.442609421887683e-08, "epoch": 18.884886058981234, "percentage": 94.42, "elapsed_time": "4:26:46", "remaining_time": "0:15:45", "throughput": 4081.69, "total_tokens": 65335408} +{"current_steps": 112710, "total_steps": 119360, "loss": 0.5554, "lr": 9.428472876091222e-08, "epoch": 18.885723860589813, "percentage": 94.43, "elapsed_time": "4:26:47", "remaining_time": "0:15:44", "throughput": 4081.7, "total_tokens": 65338064} +{"current_steps": 112715, "total_steps": 119360, "loss": 0.4073, "lr": 9.414346819424436e-08, "epoch": 18.886561662198392, "percentage": 94.43, "elapsed_time": "4:26:48", "remaining_time": "0:15:43", "throughput": 4081.7, "total_tokens": 65340752} +{"current_steps": 112720, "total_steps": 119360, "loss": 0.2048, "lr": 9.400231252189196e-08, "epoch": 18.88739946380697, "percentage": 94.44, "elapsed_time": "4:26:48", "remaining_time": "0:15:43", "throughput": 4081.71, "total_tokens": 65343760} +{"current_steps": 112725, "total_steps": 119360, "loss": 0.5578, "lr": 9.386126174687482e-08, "epoch": 18.88823726541555, "percentage": 94.44, "elapsed_time": "4:26:49", "remaining_time": "0:15:42", "throughput": 4081.72, "total_tokens": 65346512} +{"current_steps": 112730, "total_steps": 119360, "loss": 0.4231, "lr": 9.372031587220831e-08, "epoch": 18.88907506702413, "percentage": 94.45, "elapsed_time": "4:26:50", "remaining_time": "0:15:41", "throughput": 4081.73, "total_tokens": 65349360} +{"current_steps": 112735, "total_steps": 119360, "loss": 0.4193, "lr": 9.357947490090613e-08, "epoch": 18.889912868632706, "percentage": 94.45, "elapsed_time": "4:26:50", "remaining_time": "0:15:40", "throughput": 4081.73, "total_tokens": 65352048} +{"current_steps": 112740, "total_steps": 119360, "loss": 0.3143, "lr": 9.343873883597865e-08, "epoch": 18.890750670241285, "percentage": 94.45, "elapsed_time": "4:26:51", "remaining_time": "0:15:40", "throughput": 4081.74, "total_tokens": 65354832} +{"current_steps": 112745, "total_steps": 119360, "loss": 0.2989, "lr": 9.329810768043678e-08, "epoch": 18.891588471849865, "percentage": 94.46, "elapsed_time": "4:26:52", "remaining_time": "0:15:39", "throughput": 4081.75, "total_tokens": 65357648} +{"current_steps": 112750, "total_steps": 119360, "loss": 0.3299, "lr": 9.315758143728593e-08, "epoch": 18.892426273458444, "percentage": 94.46, "elapsed_time": "4:26:52", "remaining_time": "0:15:38", "throughput": 4081.76, "total_tokens": 65360912} +{"current_steps": 112755, "total_steps": 119360, "loss": 0.1278, "lr": 9.301716010953143e-08, "epoch": 18.893264075067023, "percentage": 94.47, "elapsed_time": "4:26:53", "remaining_time": "0:15:38", "throughput": 4081.77, "total_tokens": 65363888} +{"current_steps": 112760, "total_steps": 119360, "loss": 0.3835, "lr": 9.287684370017591e-08, "epoch": 18.894101876675602, "percentage": 94.47, "elapsed_time": "4:26:54", "remaining_time": "0:15:37", "throughput": 4081.79, "total_tokens": 65366960} +{"current_steps": 112765, "total_steps": 119360, "loss": 0.1504, "lr": 9.273663221221806e-08, "epoch": 18.89493967828418, "percentage": 94.47, "elapsed_time": "4:26:54", "remaining_time": "0:15:36", "throughput": 4081.79, "total_tokens": 65369936} +{"current_steps": 112770, "total_steps": 119360, "loss": 0.2153, "lr": 9.259652564865773e-08, "epoch": 18.89577747989276, "percentage": 94.48, "elapsed_time": "4:26:55", "remaining_time": "0:15:35", "throughput": 4081.8, "total_tokens": 65372880} +{"current_steps": 112775, "total_steps": 119360, "loss": 0.6453, "lr": 9.245652401249028e-08, "epoch": 18.89661528150134, "percentage": 94.48, "elapsed_time": "4:26:56", "remaining_time": "0:15:35", "throughput": 4081.82, "total_tokens": 65375568} +{"current_steps": 112780, "total_steps": 119360, "loss": 0.1965, "lr": 9.231662730670832e-08, "epoch": 18.89745308310992, "percentage": 94.49, "elapsed_time": "4:26:56", "remaining_time": "0:15:34", "throughput": 4081.83, "total_tokens": 65378608} +{"current_steps": 112785, "total_steps": 119360, "loss": 0.3273, "lr": 9.217683553430279e-08, "epoch": 18.8982908847185, "percentage": 94.49, "elapsed_time": "4:26:57", "remaining_time": "0:15:33", "throughput": 4081.85, "total_tokens": 65381712} +{"current_steps": 112790, "total_steps": 119360, "loss": 0.18, "lr": 9.203714869826408e-08, "epoch": 18.899128686327078, "percentage": 94.5, "elapsed_time": "4:26:58", "remaining_time": "0:15:33", "throughput": 4081.86, "total_tokens": 65384752} +{"current_steps": 112795, "total_steps": 119360, "loss": 0.2345, "lr": 9.189756680157758e-08, "epoch": 18.899966487935657, "percentage": 94.5, "elapsed_time": "4:26:59", "remaining_time": "0:15:32", "throughput": 4081.87, "total_tokens": 65387664} +{"current_steps": 112800, "total_steps": 119360, "loss": 0.2421, "lr": 9.175808984722868e-08, "epoch": 18.900804289544237, "percentage": 94.5, "elapsed_time": "4:26:59", "remaining_time": "0:15:31", "throughput": 4081.88, "total_tokens": 65390736} +{"current_steps": 112805, "total_steps": 119360, "loss": 0.3325, "lr": 9.161871783819887e-08, "epoch": 18.901642091152816, "percentage": 94.51, "elapsed_time": "4:27:00", "remaining_time": "0:15:30", "throughput": 4081.89, "total_tokens": 65393392} +{"current_steps": 112810, "total_steps": 119360, "loss": 0.4578, "lr": 9.147945077746855e-08, "epoch": 18.902479892761395, "percentage": 94.51, "elapsed_time": "4:27:01", "remaining_time": "0:15:30", "throughput": 4081.9, "total_tokens": 65396336} +{"current_steps": 112815, "total_steps": 119360, "loss": 0.1364, "lr": 9.13402886680148e-08, "epoch": 18.903317694369974, "percentage": 94.52, "elapsed_time": "4:27:01", "remaining_time": "0:15:29", "throughput": 4081.92, "total_tokens": 65399440} +{"current_steps": 112820, "total_steps": 119360, "loss": 0.4932, "lr": 9.120123151281469e-08, "epoch": 18.904155495978554, "percentage": 94.52, "elapsed_time": "4:27:02", "remaining_time": "0:15:28", "throughput": 4081.92, "total_tokens": 65402192} +{"current_steps": 112825, "total_steps": 119360, "loss": 0.3858, "lr": 9.106227931483913e-08, "epoch": 18.904993297587133, "percentage": 94.52, "elapsed_time": "4:27:03", "remaining_time": "0:15:28", "throughput": 4081.93, "total_tokens": 65405168} +{"current_steps": 112830, "total_steps": 119360, "loss": 0.4627, "lr": 9.092343207706134e-08, "epoch": 18.905831099195712, "percentage": 94.53, "elapsed_time": "4:27:03", "remaining_time": "0:15:27", "throughput": 4081.94, "total_tokens": 65407952} +{"current_steps": 112835, "total_steps": 119360, "loss": 0.2467, "lr": 9.078468980244892e-08, "epoch": 18.906668900804288, "percentage": 94.53, "elapsed_time": "4:27:04", "remaining_time": "0:15:26", "throughput": 4081.94, "total_tokens": 65410736} +{"current_steps": 112840, "total_steps": 119360, "loss": 0.261, "lr": 9.06460524939684e-08, "epoch": 18.907506702412867, "percentage": 94.54, "elapsed_time": "4:27:05", "remaining_time": "0:15:25", "throughput": 4081.95, "total_tokens": 65413744} +{"current_steps": 112845, "total_steps": 119360, "loss": 0.4282, "lr": 9.050752015458408e-08, "epoch": 18.908344504021446, "percentage": 94.54, "elapsed_time": "4:27:05", "remaining_time": "0:15:25", "throughput": 4081.97, "total_tokens": 65416848} +{"current_steps": 112850, "total_steps": 119360, "loss": 0.1512, "lr": 9.036909278725858e-08, "epoch": 18.909182305630026, "percentage": 94.55, "elapsed_time": "4:27:06", "remaining_time": "0:15:24", "throughput": 4081.98, "total_tokens": 65419696} +{"current_steps": 112855, "total_steps": 119360, "loss": 0.4954, "lr": 9.023077039495121e-08, "epoch": 18.910020107238605, "percentage": 94.55, "elapsed_time": "4:27:07", "remaining_time": "0:15:23", "throughput": 4082.0, "total_tokens": 65422896} +{"current_steps": 112860, "total_steps": 119360, "loss": 0.451, "lr": 9.009255298061959e-08, "epoch": 18.910857908847184, "percentage": 94.55, "elapsed_time": "4:27:07", "remaining_time": "0:15:23", "throughput": 4082.01, "total_tokens": 65425744} +{"current_steps": 112865, "total_steps": 119360, "loss": 0.0736, "lr": 8.995444054721858e-08, "epoch": 18.911695710455763, "percentage": 94.56, "elapsed_time": "4:27:08", "remaining_time": "0:15:22", "throughput": 4082.02, "total_tokens": 65428720} +{"current_steps": 112870, "total_steps": 119360, "loss": 0.135, "lr": 8.981643309770138e-08, "epoch": 18.912533512064343, "percentage": 94.56, "elapsed_time": "4:27:09", "remaining_time": "0:15:21", "throughput": 4082.03, "total_tokens": 65431568} +{"current_steps": 112875, "total_steps": 119360, "loss": 0.1885, "lr": 8.967853063501952e-08, "epoch": 18.913371313672922, "percentage": 94.57, "elapsed_time": "4:27:09", "remaining_time": "0:15:20", "throughput": 4082.03, "total_tokens": 65434480} +{"current_steps": 112880, "total_steps": 119360, "loss": 0.4257, "lr": 8.95407331621212e-08, "epoch": 18.9142091152815, "percentage": 94.57, "elapsed_time": "4:27:10", "remaining_time": "0:15:20", "throughput": 4082.04, "total_tokens": 65437264} +{"current_steps": 112885, "total_steps": 119360, "loss": 0.4725, "lr": 8.940304068195182e-08, "epoch": 18.91504691689008, "percentage": 94.58, "elapsed_time": "4:27:11", "remaining_time": "0:15:19", "throughput": 4082.06, "total_tokens": 65440432} +{"current_steps": 112890, "total_steps": 119360, "loss": 0.3758, "lr": 8.926545319745683e-08, "epoch": 18.91588471849866, "percentage": 94.58, "elapsed_time": "4:27:11", "remaining_time": "0:15:18", "throughput": 4082.06, "total_tokens": 65443088} +{"current_steps": 112895, "total_steps": 119360, "loss": 0.4517, "lr": 8.91279707115772e-08, "epoch": 18.91672252010724, "percentage": 94.58, "elapsed_time": "4:27:12", "remaining_time": "0:15:18", "throughput": 4082.07, "total_tokens": 65445968} +{"current_steps": 112900, "total_steps": 119360, "loss": 0.2818, "lr": 8.899059322725278e-08, "epoch": 18.91756032171582, "percentage": 94.59, "elapsed_time": "4:27:13", "remaining_time": "0:15:17", "throughput": 4082.09, "total_tokens": 65449104} +{"current_steps": 112905, "total_steps": 119360, "loss": 0.7382, "lr": 8.885332074742014e-08, "epoch": 18.918398123324398, "percentage": 94.59, "elapsed_time": "4:27:13", "remaining_time": "0:15:16", "throughput": 4082.09, "total_tokens": 65451920} +{"current_steps": 112910, "total_steps": 119360, "loss": 0.4956, "lr": 8.871615327501638e-08, "epoch": 18.919235924932977, "percentage": 94.6, "elapsed_time": "4:27:14", "remaining_time": "0:15:15", "throughput": 4082.1, "total_tokens": 65454704} +{"current_steps": 112915, "total_steps": 119360, "loss": 0.5005, "lr": 8.85790908129719e-08, "epoch": 18.920073726541556, "percentage": 94.6, "elapsed_time": "4:27:15", "remaining_time": "0:15:15", "throughput": 4082.11, "total_tokens": 65457584} +{"current_steps": 112920, "total_steps": 119360, "loss": 0.2722, "lr": 8.84421333642188e-08, "epoch": 18.920911528150135, "percentage": 94.6, "elapsed_time": "4:27:15", "remaining_time": "0:15:14", "throughput": 4082.13, "total_tokens": 65460688} +{"current_steps": 112925, "total_steps": 119360, "loss": 0.1651, "lr": 8.830528093168533e-08, "epoch": 18.921749329758715, "percentage": 94.61, "elapsed_time": "4:27:16", "remaining_time": "0:15:13", "throughput": 4082.13, "total_tokens": 65463472} +{"current_steps": 112930, "total_steps": 119360, "loss": 0.3532, "lr": 8.81685335182969e-08, "epoch": 18.922587131367294, "percentage": 94.61, "elapsed_time": "4:27:17", "remaining_time": "0:15:13", "throughput": 4082.14, "total_tokens": 65466192} +{"current_steps": 112935, "total_steps": 119360, "loss": 0.5238, "lr": 8.80318911269773e-08, "epoch": 18.92342493297587, "percentage": 94.62, "elapsed_time": "4:27:17", "remaining_time": "0:15:12", "throughput": 4082.15, "total_tokens": 65469040} +{"current_steps": 112940, "total_steps": 119360, "loss": 0.2269, "lr": 8.789535376064973e-08, "epoch": 18.92426273458445, "percentage": 94.62, "elapsed_time": "4:27:18", "remaining_time": "0:15:11", "throughput": 4082.16, "total_tokens": 65472048} +{"current_steps": 112945, "total_steps": 119360, "loss": 0.3961, "lr": 8.775892142223186e-08, "epoch": 18.92510053619303, "percentage": 94.63, "elapsed_time": "4:27:19", "remaining_time": "0:15:10", "throughput": 4082.16, "total_tokens": 65474864} +{"current_steps": 112950, "total_steps": 119360, "loss": 0.3101, "lr": 8.76225941146408e-08, "epoch": 18.925938337801608, "percentage": 94.63, "elapsed_time": "4:27:19", "remaining_time": "0:15:10", "throughput": 4082.17, "total_tokens": 65477520} +{"current_steps": 112955, "total_steps": 119360, "loss": 0.4213, "lr": 8.748637184079312e-08, "epoch": 18.926776139410187, "percentage": 94.63, "elapsed_time": "4:27:20", "remaining_time": "0:15:09", "throughput": 4082.17, "total_tokens": 65480368} +{"current_steps": 112960, "total_steps": 119360, "loss": 0.2989, "lr": 8.73502546035998e-08, "epoch": 18.927613941018766, "percentage": 94.64, "elapsed_time": "4:27:21", "remaining_time": "0:15:08", "throughput": 4082.17, "total_tokens": 65483056} +{"current_steps": 112965, "total_steps": 119360, "loss": 0.3712, "lr": 8.721424240597187e-08, "epoch": 18.928451742627345, "percentage": 94.64, "elapsed_time": "4:27:21", "remaining_time": "0:15:08", "throughput": 4082.18, "total_tokens": 65485712} +{"current_steps": 112970, "total_steps": 119360, "loss": 0.3609, "lr": 8.7078335250817e-08, "epoch": 18.929289544235925, "percentage": 94.65, "elapsed_time": "4:27:22", "remaining_time": "0:15:07", "throughput": 4082.19, "total_tokens": 65488624} +{"current_steps": 112975, "total_steps": 119360, "loss": 0.6747, "lr": 8.694253314104173e-08, "epoch": 18.930127345844504, "percentage": 94.65, "elapsed_time": "4:27:23", "remaining_time": "0:15:06", "throughput": 4082.19, "total_tokens": 65491536} +{"current_steps": 112980, "total_steps": 119360, "loss": 0.4789, "lr": 8.680683607954987e-08, "epoch": 18.930965147453083, "percentage": 94.65, "elapsed_time": "4:27:23", "remaining_time": "0:15:06", "throughput": 4082.21, "total_tokens": 65494608} +{"current_steps": 112985, "total_steps": 119360, "loss": 0.1642, "lr": 8.667124406924188e-08, "epoch": 18.931802949061662, "percentage": 94.66, "elapsed_time": "4:27:24", "remaining_time": "0:15:05", "throughput": 4082.22, "total_tokens": 65497616} +{"current_steps": 112990, "total_steps": 119360, "loss": 0.2282, "lr": 8.65357571130171e-08, "epoch": 18.93264075067024, "percentage": 94.66, "elapsed_time": "4:27:25", "remaining_time": "0:15:04", "throughput": 4082.22, "total_tokens": 65500240} +{"current_steps": 112995, "total_steps": 119360, "loss": 0.4254, "lr": 8.64003752137732e-08, "epoch": 18.93347855227882, "percentage": 94.67, "elapsed_time": "4:27:25", "remaining_time": "0:15:03", "throughput": 4082.23, "total_tokens": 65503056} +{"current_steps": 113000, "total_steps": 119360, "loss": 0.3469, "lr": 8.626509837440456e-08, "epoch": 18.9343163538874, "percentage": 94.67, "elapsed_time": "4:27:26", "remaining_time": "0:15:03", "throughput": 4082.24, "total_tokens": 65505776} +{"current_steps": 113005, "total_steps": 119360, "loss": 0.4911, "lr": 8.612992659780328e-08, "epoch": 18.93515415549598, "percentage": 94.68, "elapsed_time": "4:27:27", "remaining_time": "0:15:02", "throughput": 4082.25, "total_tokens": 65508816} +{"current_steps": 113010, "total_steps": 119360, "loss": 0.6144, "lr": 8.599485988685874e-08, "epoch": 18.93599195710456, "percentage": 94.68, "elapsed_time": "4:27:27", "remaining_time": "0:15:01", "throughput": 4082.26, "total_tokens": 65511728} +{"current_steps": 113015, "total_steps": 119360, "loss": 0.3208, "lr": 8.585989824446139e-08, "epoch": 18.936829758713138, "percentage": 94.68, "elapsed_time": "4:27:28", "remaining_time": "0:15:01", "throughput": 4082.27, "total_tokens": 65514448} +{"current_steps": 113020, "total_steps": 119360, "loss": 0.2336, "lr": 8.572504167349449e-08, "epoch": 18.937667560321717, "percentage": 94.69, "elapsed_time": "4:27:29", "remaining_time": "0:15:00", "throughput": 4082.27, "total_tokens": 65517200} +{"current_steps": 113025, "total_steps": 119360, "loss": 0.1758, "lr": 8.559029017684184e-08, "epoch": 18.938505361930297, "percentage": 94.69, "elapsed_time": "4:27:29", "remaining_time": "0:14:59", "throughput": 4082.28, "total_tokens": 65519856} +{"current_steps": 113030, "total_steps": 119360, "loss": 0.287, "lr": 8.545564375738557e-08, "epoch": 18.939343163538872, "percentage": 94.7, "elapsed_time": "4:27:30", "remaining_time": "0:14:58", "throughput": 4082.29, "total_tokens": 65522928} +{"current_steps": 113035, "total_steps": 119360, "loss": 0.492, "lr": 8.532110241800396e-08, "epoch": 18.94018096514745, "percentage": 94.7, "elapsed_time": "4:27:31", "remaining_time": "0:14:58", "throughput": 4082.31, "total_tokens": 65526096} +{"current_steps": 113040, "total_steps": 119360, "loss": 0.431, "lr": 8.518666616157412e-08, "epoch": 18.94101876675603, "percentage": 94.71, "elapsed_time": "4:27:31", "remaining_time": "0:14:57", "throughput": 4082.32, "total_tokens": 65529040} +{"current_steps": 113045, "total_steps": 119360, "loss": 0.4279, "lr": 8.505233499097043e-08, "epoch": 18.94185656836461, "percentage": 94.71, "elapsed_time": "4:27:32", "remaining_time": "0:14:56", "throughput": 4082.33, "total_tokens": 65531920} +{"current_steps": 113050, "total_steps": 119360, "loss": 0.4192, "lr": 8.491810890906394e-08, "epoch": 18.94269436997319, "percentage": 94.71, "elapsed_time": "4:27:33", "remaining_time": "0:14:56", "throughput": 4082.33, "total_tokens": 65534832} +{"current_steps": 113055, "total_steps": 119360, "loss": 0.3589, "lr": 8.478398791872566e-08, "epoch": 18.94353217158177, "percentage": 94.72, "elapsed_time": "4:27:33", "remaining_time": "0:14:55", "throughput": 4082.34, "total_tokens": 65537712} +{"current_steps": 113060, "total_steps": 119360, "loss": 0.2783, "lr": 8.464997202282444e-08, "epoch": 18.944369973190348, "percentage": 94.72, "elapsed_time": "4:27:34", "remaining_time": "0:14:54", "throughput": 4082.35, "total_tokens": 65540688} +{"current_steps": 113065, "total_steps": 119360, "loss": 0.4896, "lr": 8.451606122422351e-08, "epoch": 18.945207774798927, "percentage": 94.73, "elapsed_time": "4:27:35", "remaining_time": "0:14:53", "throughput": 4082.37, "total_tokens": 65543728} +{"current_steps": 113070, "total_steps": 119360, "loss": 0.4102, "lr": 8.438225552578672e-08, "epoch": 18.946045576407506, "percentage": 94.73, "elapsed_time": "4:27:35", "remaining_time": "0:14:53", "throughput": 4082.38, "total_tokens": 65546672} +{"current_steps": 113075, "total_steps": 119360, "loss": 0.294, "lr": 8.424855493037564e-08, "epoch": 18.946883378016086, "percentage": 94.73, "elapsed_time": "4:27:36", "remaining_time": "0:14:52", "throughput": 4082.39, "total_tokens": 65549456} +{"current_steps": 113080, "total_steps": 119360, "loss": 0.3078, "lr": 8.411495944084913e-08, "epoch": 18.947721179624665, "percentage": 94.74, "elapsed_time": "4:27:37", "remaining_time": "0:14:51", "throughput": 4082.39, "total_tokens": 65552176} +{"current_steps": 113085, "total_steps": 119360, "loss": 0.3367, "lr": 8.398146906006265e-08, "epoch": 18.948558981233244, "percentage": 94.74, "elapsed_time": "4:27:37", "remaining_time": "0:14:51", "throughput": 4082.41, "total_tokens": 65555216} +{"current_steps": 113090, "total_steps": 119360, "loss": 0.4925, "lr": 8.384808379087118e-08, "epoch": 18.949396782841823, "percentage": 94.75, "elapsed_time": "4:27:38", "remaining_time": "0:14:50", "throughput": 4082.42, "total_tokens": 65558160} +{"current_steps": 113095, "total_steps": 119360, "loss": 0.2519, "lr": 8.371480363612628e-08, "epoch": 18.950234584450403, "percentage": 94.75, "elapsed_time": "4:27:39", "remaining_time": "0:14:49", "throughput": 4082.43, "total_tokens": 65561168} +{"current_steps": 113100, "total_steps": 119360, "loss": 0.1549, "lr": 8.358162859867791e-08, "epoch": 18.951072386058982, "percentage": 94.76, "elapsed_time": "4:27:39", "remaining_time": "0:14:48", "throughput": 4082.44, "total_tokens": 65563824} +{"current_steps": 113105, "total_steps": 119360, "loss": 0.2824, "lr": 8.344855868137381e-08, "epoch": 18.95191018766756, "percentage": 94.76, "elapsed_time": "4:27:40", "remaining_time": "0:14:48", "throughput": 4082.45, "total_tokens": 65566800} +{"current_steps": 113110, "total_steps": 119360, "loss": 0.2489, "lr": 8.33155938870589e-08, "epoch": 18.95274798927614, "percentage": 94.76, "elapsed_time": "4:27:41", "remaining_time": "0:14:47", "throughput": 4082.46, "total_tokens": 65569744} +{"current_steps": 113115, "total_steps": 119360, "loss": 0.6421, "lr": 8.318273421857592e-08, "epoch": 18.95358579088472, "percentage": 94.77, "elapsed_time": "4:27:41", "remaining_time": "0:14:46", "throughput": 4082.47, "total_tokens": 65572496} +{"current_steps": 113120, "total_steps": 119360, "loss": 0.6956, "lr": 8.304997967876593e-08, "epoch": 18.9544235924933, "percentage": 94.77, "elapsed_time": "4:27:42", "remaining_time": "0:14:46", "throughput": 4082.47, "total_tokens": 65575248} +{"current_steps": 113125, "total_steps": 119360, "loss": 0.4454, "lr": 8.291733027046722e-08, "epoch": 18.95526139410188, "percentage": 94.78, "elapsed_time": "4:27:43", "remaining_time": "0:14:45", "throughput": 4082.48, "total_tokens": 65578000} +{"current_steps": 113130, "total_steps": 119360, "loss": 0.1647, "lr": 8.27847859965164e-08, "epoch": 18.956099195710454, "percentage": 94.78, "elapsed_time": "4:27:43", "remaining_time": "0:14:44", "throughput": 4082.49, "total_tokens": 65581040} +{"current_steps": 113135, "total_steps": 119360, "loss": 0.0883, "lr": 8.265234685974677e-08, "epoch": 18.956936997319033, "percentage": 94.78, "elapsed_time": "4:27:44", "remaining_time": "0:14:43", "throughput": 4082.49, "total_tokens": 65583728} +{"current_steps": 113140, "total_steps": 119360, "loss": 0.3832, "lr": 8.252001286299105e-08, "epoch": 18.957774798927613, "percentage": 94.79, "elapsed_time": "4:27:45", "remaining_time": "0:14:43", "throughput": 4082.5, "total_tokens": 65586544} +{"current_steps": 113145, "total_steps": 119360, "loss": 0.2271, "lr": 8.238778400907754e-08, "epoch": 18.958612600536192, "percentage": 94.79, "elapsed_time": "4:27:45", "remaining_time": "0:14:42", "throughput": 4082.51, "total_tokens": 65589328} +{"current_steps": 113150, "total_steps": 119360, "loss": 0.3206, "lr": 8.22556603008351e-08, "epoch": 18.95945040214477, "percentage": 94.8, "elapsed_time": "4:27:46", "remaining_time": "0:14:41", "throughput": 4082.52, "total_tokens": 65592176} +{"current_steps": 113155, "total_steps": 119360, "loss": 0.4228, "lr": 8.212364174108645e-08, "epoch": 18.96028820375335, "percentage": 94.8, "elapsed_time": "4:27:47", "remaining_time": "0:14:41", "throughput": 4082.52, "total_tokens": 65595056} +{"current_steps": 113160, "total_steps": 119360, "loss": 0.4745, "lr": 8.199172833265601e-08, "epoch": 18.96112600536193, "percentage": 94.81, "elapsed_time": "4:27:47", "remaining_time": "0:14:40", "throughput": 4082.54, "total_tokens": 65597936} +{"current_steps": 113165, "total_steps": 119360, "loss": 0.5512, "lr": 8.185992007836485e-08, "epoch": 18.96196380697051, "percentage": 94.81, "elapsed_time": "4:27:48", "remaining_time": "0:14:39", "throughput": 4082.55, "total_tokens": 65600848} +{"current_steps": 113170, "total_steps": 119360, "loss": 0.5452, "lr": 8.172821698102962e-08, "epoch": 18.96280160857909, "percentage": 94.81, "elapsed_time": "4:27:49", "remaining_time": "0:14:38", "throughput": 4082.56, "total_tokens": 65603760} +{"current_steps": 113175, "total_steps": 119360, "loss": 0.7111, "lr": 8.159661904346695e-08, "epoch": 18.963639410187668, "percentage": 94.82, "elapsed_time": "4:27:49", "remaining_time": "0:14:38", "throughput": 4082.57, "total_tokens": 65606768} +{"current_steps": 113180, "total_steps": 119360, "loss": 0.4428, "lr": 8.146512626849068e-08, "epoch": 18.964477211796247, "percentage": 94.82, "elapsed_time": "4:27:50", "remaining_time": "0:14:37", "throughput": 4082.58, "total_tokens": 65609584} +{"current_steps": 113185, "total_steps": 119360, "loss": 0.3164, "lr": 8.133373865891191e-08, "epoch": 18.965315013404826, "percentage": 94.83, "elapsed_time": "4:27:51", "remaining_time": "0:14:36", "throughput": 4082.58, "total_tokens": 65612336} +{"current_steps": 113190, "total_steps": 119360, "loss": 0.2716, "lr": 8.120245621754064e-08, "epoch": 18.966152815013405, "percentage": 94.83, "elapsed_time": "4:27:51", "remaining_time": "0:14:36", "throughput": 4082.6, "total_tokens": 65615184} +{"current_steps": 113195, "total_steps": 119360, "loss": 0.4511, "lr": 8.107127894718348e-08, "epoch": 18.966990616621985, "percentage": 94.83, "elapsed_time": "4:27:52", "remaining_time": "0:14:35", "throughput": 4082.61, "total_tokens": 65618416} +{"current_steps": 113200, "total_steps": 119360, "loss": 0.1369, "lr": 8.094020685064486e-08, "epoch": 18.967828418230564, "percentage": 94.84, "elapsed_time": "4:27:53", "remaining_time": "0:14:34", "throughput": 4082.62, "total_tokens": 65621296} +{"current_steps": 113205, "total_steps": 119360, "loss": 0.2801, "lr": 8.080923993072809e-08, "epoch": 18.968666219839143, "percentage": 94.84, "elapsed_time": "4:27:53", "remaining_time": "0:14:33", "throughput": 4082.62, "total_tokens": 65623984} +{"current_steps": 113210, "total_steps": 119360, "loss": 0.2958, "lr": 8.067837819023317e-08, "epoch": 18.969504021447722, "percentage": 94.85, "elapsed_time": "4:27:54", "remaining_time": "0:14:33", "throughput": 4082.63, "total_tokens": 65626800} +{"current_steps": 113215, "total_steps": 119360, "loss": 0.2739, "lr": 8.054762163195728e-08, "epoch": 18.9703418230563, "percentage": 94.85, "elapsed_time": "4:27:55", "remaining_time": "0:14:32", "throughput": 4082.64, "total_tokens": 65629616} +{"current_steps": 113220, "total_steps": 119360, "loss": 0.598, "lr": 8.04169702586971e-08, "epoch": 18.97117962466488, "percentage": 94.86, "elapsed_time": "4:27:55", "remaining_time": "0:14:31", "throughput": 4082.65, "total_tokens": 65632432} +{"current_steps": 113225, "total_steps": 119360, "loss": 0.4306, "lr": 8.028642407324594e-08, "epoch": 18.97201742627346, "percentage": 94.86, "elapsed_time": "4:27:56", "remaining_time": "0:14:31", "throughput": 4082.66, "total_tokens": 65635440} +{"current_steps": 113230, "total_steps": 119360, "loss": 0.2551, "lr": 8.01559830783949e-08, "epoch": 18.972855227882036, "percentage": 94.86, "elapsed_time": "4:27:57", "remaining_time": "0:14:30", "throughput": 4082.67, "total_tokens": 65638384} +{"current_steps": 113235, "total_steps": 119360, "loss": 0.4214, "lr": 8.002564727693285e-08, "epoch": 18.973693029490615, "percentage": 94.87, "elapsed_time": "4:27:58", "remaining_time": "0:14:29", "throughput": 4082.68, "total_tokens": 65641360} +{"current_steps": 113240, "total_steps": 119360, "loss": 0.4139, "lr": 7.989541667164702e-08, "epoch": 18.974530831099194, "percentage": 94.87, "elapsed_time": "4:27:58", "remaining_time": "0:14:28", "throughput": 4082.7, "total_tokens": 65644624} +{"current_steps": 113245, "total_steps": 119360, "loss": 0.4001, "lr": 7.976529126532184e-08, "epoch": 18.975368632707774, "percentage": 94.88, "elapsed_time": "4:27:59", "remaining_time": "0:14:28", "throughput": 4082.7, "total_tokens": 65647408} +{"current_steps": 113250, "total_steps": 119360, "loss": 0.319, "lr": 7.963527106073954e-08, "epoch": 18.976206434316353, "percentage": 94.88, "elapsed_time": "4:28:00", "remaining_time": "0:14:27", "throughput": 4082.71, "total_tokens": 65650096} +{"current_steps": 113255, "total_steps": 119360, "loss": 0.3902, "lr": 7.950535606067955e-08, "epoch": 18.977044235924932, "percentage": 94.89, "elapsed_time": "4:28:00", "remaining_time": "0:14:26", "throughput": 4082.72, "total_tokens": 65652976} +{"current_steps": 113260, "total_steps": 119360, "loss": 0.1584, "lr": 7.937554626792022e-08, "epoch": 18.97788203753351, "percentage": 94.89, "elapsed_time": "4:28:01", "remaining_time": "0:14:26", "throughput": 4082.73, "total_tokens": 65655792} +{"current_steps": 113265, "total_steps": 119360, "loss": 0.2004, "lr": 7.924584168523708e-08, "epoch": 18.97871983914209, "percentage": 94.89, "elapsed_time": "4:28:02", "remaining_time": "0:14:25", "throughput": 4082.73, "total_tokens": 65658512} +{"current_steps": 113270, "total_steps": 119360, "loss": 0.4694, "lr": 7.911624231540404e-08, "epoch": 18.97955764075067, "percentage": 94.9, "elapsed_time": "4:28:02", "remaining_time": "0:14:24", "throughput": 4082.74, "total_tokens": 65661168} +{"current_steps": 113275, "total_steps": 119360, "loss": 0.3616, "lr": 7.898674816119056e-08, "epoch": 18.98039544235925, "percentage": 94.9, "elapsed_time": "4:28:03", "remaining_time": "0:14:23", "throughput": 4082.75, "total_tokens": 65664208} +{"current_steps": 113280, "total_steps": 119360, "loss": 0.4178, "lr": 7.885735922536664e-08, "epoch": 18.98123324396783, "percentage": 94.91, "elapsed_time": "4:28:04", "remaining_time": "0:14:23", "throughput": 4082.76, "total_tokens": 65667152} +{"current_steps": 113285, "total_steps": 119360, "loss": 0.4337, "lr": 7.872807551069784e-08, "epoch": 18.982071045576408, "percentage": 94.91, "elapsed_time": "4:28:04", "remaining_time": "0:14:22", "throughput": 4082.77, "total_tokens": 65670256} +{"current_steps": 113290, "total_steps": 119360, "loss": 0.3342, "lr": 7.859889701994972e-08, "epoch": 18.982908847184987, "percentage": 94.91, "elapsed_time": "4:28:05", "remaining_time": "0:14:21", "throughput": 4082.78, "total_tokens": 65673264} +{"current_steps": 113295, "total_steps": 119360, "loss": 0.1858, "lr": 7.846982375588285e-08, "epoch": 18.983746648793566, "percentage": 94.92, "elapsed_time": "4:28:06", "remaining_time": "0:14:21", "throughput": 4082.8, "total_tokens": 65676400} +{"current_steps": 113300, "total_steps": 119360, "loss": 0.1516, "lr": 7.834085572125838e-08, "epoch": 18.984584450402146, "percentage": 94.92, "elapsed_time": "4:28:06", "remaining_time": "0:14:20", "throughput": 4082.8, "total_tokens": 65679056} +{"current_steps": 113305, "total_steps": 119360, "loss": 0.1828, "lr": 7.821199291883296e-08, "epoch": 18.985422252010725, "percentage": 94.93, "elapsed_time": "4:28:07", "remaining_time": "0:14:19", "throughput": 4082.8, "total_tokens": 65681616} +{"current_steps": 113310, "total_steps": 119360, "loss": 0.2114, "lr": 7.808323535136165e-08, "epoch": 18.986260053619304, "percentage": 94.93, "elapsed_time": "4:28:08", "remaining_time": "0:14:18", "throughput": 4082.81, "total_tokens": 65684432} +{"current_steps": 113315, "total_steps": 119360, "loss": 0.2544, "lr": 7.795458302159886e-08, "epoch": 18.987097855227884, "percentage": 94.94, "elapsed_time": "4:28:08", "remaining_time": "0:14:18", "throughput": 4082.82, "total_tokens": 65687312} +{"current_steps": 113320, "total_steps": 119360, "loss": 0.2146, "lr": 7.782603593229354e-08, "epoch": 18.987935656836463, "percentage": 94.94, "elapsed_time": "4:28:09", "remaining_time": "0:14:17", "throughput": 4082.83, "total_tokens": 65690448} +{"current_steps": 113325, "total_steps": 119360, "loss": 0.5205, "lr": 7.769759408619571e-08, "epoch": 18.98877345844504, "percentage": 94.94, "elapsed_time": "4:28:10", "remaining_time": "0:14:16", "throughput": 4082.84, "total_tokens": 65693360} +{"current_steps": 113330, "total_steps": 119360, "loss": 0.3273, "lr": 7.756925748605093e-08, "epoch": 18.989611260053618, "percentage": 94.95, "elapsed_time": "4:28:10", "remaining_time": "0:14:16", "throughput": 4082.84, "total_tokens": 65695984} +{"current_steps": 113335, "total_steps": 119360, "loss": 0.1591, "lr": 7.744102613460313e-08, "epoch": 18.990449061662197, "percentage": 94.95, "elapsed_time": "4:28:11", "remaining_time": "0:14:15", "throughput": 4082.85, "total_tokens": 65698768} +{"current_steps": 113340, "total_steps": 119360, "loss": 0.3718, "lr": 7.731290003459402e-08, "epoch": 18.991286863270776, "percentage": 94.96, "elapsed_time": "4:28:12", "remaining_time": "0:14:14", "throughput": 4082.86, "total_tokens": 65701616} +{"current_steps": 113345, "total_steps": 119360, "loss": 0.3313, "lr": 7.71848791887636e-08, "epoch": 18.992124664879356, "percentage": 94.96, "elapsed_time": "4:28:12", "remaining_time": "0:14:14", "throughput": 4082.86, "total_tokens": 65704496} +{"current_steps": 113350, "total_steps": 119360, "loss": 0.3734, "lr": 7.705696359984916e-08, "epoch": 18.992962466487935, "percentage": 94.96, "elapsed_time": "4:28:13", "remaining_time": "0:14:13", "throughput": 4082.87, "total_tokens": 65707280} +{"current_steps": 113355, "total_steps": 119360, "loss": 0.527, "lr": 7.692915327058514e-08, "epoch": 18.993800268096514, "percentage": 94.97, "elapsed_time": "4:28:14", "remaining_time": "0:14:12", "throughput": 4082.88, "total_tokens": 65710320} +{"current_steps": 113360, "total_steps": 119360, "loss": 0.6702, "lr": 7.68014482037044e-08, "epoch": 18.994638069705093, "percentage": 94.97, "elapsed_time": "4:28:14", "remaining_time": "0:14:11", "throughput": 4082.9, "total_tokens": 65713424} +{"current_steps": 113365, "total_steps": 119360, "loss": 0.2559, "lr": 7.667384840193804e-08, "epoch": 18.995475871313673, "percentage": 94.98, "elapsed_time": "4:28:15", "remaining_time": "0:14:11", "throughput": 4082.9, "total_tokens": 65716144} +{"current_steps": 113370, "total_steps": 119360, "loss": 0.4926, "lr": 7.654635386801446e-08, "epoch": 18.996313672922252, "percentage": 94.98, "elapsed_time": "4:28:16", "remaining_time": "0:14:10", "throughput": 4082.91, "total_tokens": 65718896} +{"current_steps": 113375, "total_steps": 119360, "loss": 0.4993, "lr": 7.64189646046587e-08, "epoch": 18.99715147453083, "percentage": 94.99, "elapsed_time": "4:28:16", "remaining_time": "0:14:09", "throughput": 4082.93, "total_tokens": 65721904} +{"current_steps": 113380, "total_steps": 119360, "loss": 0.303, "lr": 7.629168061459469e-08, "epoch": 18.99798927613941, "percentage": 94.99, "elapsed_time": "4:28:17", "remaining_time": "0:14:09", "throughput": 4082.93, "total_tokens": 65724624} +{"current_steps": 113385, "total_steps": 119360, "loss": 0.1808, "lr": 7.616450190054526e-08, "epoch": 18.99882707774799, "percentage": 94.99, "elapsed_time": "4:28:18", "remaining_time": "0:14:08", "throughput": 4082.94, "total_tokens": 65727376} +{"current_steps": 113390, "total_steps": 119360, "loss": 0.2844, "lr": 7.603742846522821e-08, "epoch": 18.99966487935657, "percentage": 95.0, "elapsed_time": "4:28:18", "remaining_time": "0:14:07", "throughput": 4082.95, "total_tokens": 65730512} +{"current_steps": 113395, "total_steps": 119360, "loss": 0.285, "lr": 7.591046031136085e-08, "epoch": 19.00050268096515, "percentage": 95.0, "elapsed_time": "4:28:19", "remaining_time": "0:14:06", "throughput": 4082.92, "total_tokens": 65733048} +{"current_steps": 113400, "total_steps": 119360, "loss": 0.2685, "lr": 7.578359744165819e-08, "epoch": 19.001340482573728, "percentage": 95.01, "elapsed_time": "4:28:20", "remaining_time": "0:14:06", "throughput": 4082.92, "total_tokens": 65735832} +{"current_steps": 113405, "total_steps": 119360, "loss": 0.2149, "lr": 7.565683985883254e-08, "epoch": 19.002178284182307, "percentage": 95.01, "elapsed_time": "4:28:20", "remaining_time": "0:14:05", "throughput": 4082.93, "total_tokens": 65738616} +{"current_steps": 113410, "total_steps": 119360, "loss": 0.2667, "lr": 7.553018756559449e-08, "epoch": 19.003016085790886, "percentage": 95.02, "elapsed_time": "4:28:21", "remaining_time": "0:14:04", "throughput": 4082.94, "total_tokens": 65741816} +{"current_steps": 113415, "total_steps": 119360, "loss": 0.3574, "lr": 7.540364056465188e-08, "epoch": 19.003853887399465, "percentage": 95.02, "elapsed_time": "4:28:22", "remaining_time": "0:14:04", "throughput": 4082.95, "total_tokens": 65744920} +{"current_steps": 113420, "total_steps": 119360, "loss": 0.3842, "lr": 7.527719885871088e-08, "epoch": 19.004691689008045, "percentage": 95.02, "elapsed_time": "4:28:22", "remaining_time": "0:14:03", "throughput": 4082.95, "total_tokens": 65747640} +{"current_steps": 113425, "total_steps": 119360, "loss": 0.2445, "lr": 7.515086245047376e-08, "epoch": 19.00552949061662, "percentage": 95.03, "elapsed_time": "4:28:23", "remaining_time": "0:14:02", "throughput": 4082.96, "total_tokens": 65750552} +{"current_steps": 113430, "total_steps": 119360, "loss": 0.3255, "lr": 7.502463134264392e-08, "epoch": 19.0063672922252, "percentage": 95.03, "elapsed_time": "4:28:24", "remaining_time": "0:14:01", "throughput": 4082.97, "total_tokens": 65753336} +{"current_steps": 113435, "total_steps": 119360, "loss": 0.5712, "lr": 7.489850553791811e-08, "epoch": 19.00720509383378, "percentage": 95.04, "elapsed_time": "4:28:24", "remaining_time": "0:14:01", "throughput": 4082.97, "total_tokens": 65755992} +{"current_steps": 113440, "total_steps": 119360, "loss": 0.4786, "lr": 7.477248503899359e-08, "epoch": 19.008042895442358, "percentage": 95.04, "elapsed_time": "4:28:25", "remaining_time": "0:14:00", "throughput": 4082.98, "total_tokens": 65758776} +{"current_steps": 113445, "total_steps": 119360, "loss": 0.2959, "lr": 7.4646569848566e-08, "epoch": 19.008880697050937, "percentage": 95.04, "elapsed_time": "4:28:26", "remaining_time": "0:13:59", "throughput": 4082.99, "total_tokens": 65761624} +{"current_steps": 113450, "total_steps": 119360, "loss": 0.3004, "lr": 7.45207599693265e-08, "epoch": 19.009718498659517, "percentage": 95.05, "elapsed_time": "4:28:26", "remaining_time": "0:13:59", "throughput": 4083.01, "total_tokens": 65764888} +{"current_steps": 113455, "total_steps": 119360, "loss": 0.206, "lr": 7.439505540396575e-08, "epoch": 19.010556300268096, "percentage": 95.05, "elapsed_time": "4:28:27", "remaining_time": "0:13:58", "throughput": 4083.02, "total_tokens": 65767704} +{"current_steps": 113460, "total_steps": 119360, "loss": 0.3688, "lr": 7.426945615517101e-08, "epoch": 19.011394101876675, "percentage": 95.06, "elapsed_time": "4:28:28", "remaining_time": "0:13:57", "throughput": 4083.03, "total_tokens": 65770648} +{"current_steps": 113465, "total_steps": 119360, "loss": 0.2782, "lr": 7.414396222562792e-08, "epoch": 19.012231903485254, "percentage": 95.06, "elapsed_time": "4:28:28", "remaining_time": "0:13:56", "throughput": 4083.04, "total_tokens": 65773528} +{"current_steps": 113470, "total_steps": 119360, "loss": 0.3029, "lr": 7.401857361801989e-08, "epoch": 19.013069705093834, "percentage": 95.07, "elapsed_time": "4:28:29", "remaining_time": "0:13:56", "throughput": 4083.05, "total_tokens": 65776696} +{"current_steps": 113475, "total_steps": 119360, "loss": 0.2347, "lr": 7.389329033502812e-08, "epoch": 19.013907506702413, "percentage": 95.07, "elapsed_time": "4:28:30", "remaining_time": "0:13:55", "throughput": 4083.06, "total_tokens": 65779736} +{"current_steps": 113480, "total_steps": 119360, "loss": 0.2596, "lr": 7.376811237933046e-08, "epoch": 19.014745308310992, "percentage": 95.07, "elapsed_time": "4:28:31", "remaining_time": "0:13:54", "throughput": 4083.07, "total_tokens": 65782552} +{"current_steps": 113485, "total_steps": 119360, "loss": 0.4156, "lr": 7.364303975360365e-08, "epoch": 19.01558310991957, "percentage": 95.08, "elapsed_time": "4:28:31", "remaining_time": "0:13:54", "throughput": 4083.08, "total_tokens": 65785496} +{"current_steps": 113490, "total_steps": 119360, "loss": 0.2151, "lr": 7.351807246052334e-08, "epoch": 19.01642091152815, "percentage": 95.08, "elapsed_time": "4:28:32", "remaining_time": "0:13:53", "throughput": 4083.09, "total_tokens": 65788184} +{"current_steps": 113495, "total_steps": 119360, "loss": 0.2634, "lr": 7.33932105027596e-08, "epoch": 19.01725871313673, "percentage": 95.09, "elapsed_time": "4:28:33", "remaining_time": "0:13:52", "throughput": 4083.1, "total_tokens": 65791224} +{"current_steps": 113500, "total_steps": 119360, "loss": 0.5222, "lr": 7.32684538829831e-08, "epoch": 19.01809651474531, "percentage": 95.09, "elapsed_time": "4:28:33", "remaining_time": "0:13:51", "throughput": 4083.11, "total_tokens": 65794232} +{"current_steps": 113505, "total_steps": 119360, "loss": 0.2102, "lr": 7.314380260386111e-08, "epoch": 19.01893431635389, "percentage": 95.09, "elapsed_time": "4:28:34", "remaining_time": "0:13:51", "throughput": 4083.13, "total_tokens": 65797368} +{"current_steps": 113510, "total_steps": 119360, "loss": 0.1974, "lr": 7.301925666805931e-08, "epoch": 19.019772117962468, "percentage": 95.1, "elapsed_time": "4:28:35", "remaining_time": "0:13:50", "throughput": 4083.14, "total_tokens": 65800280} +{"current_steps": 113515, "total_steps": 119360, "loss": 0.4608, "lr": 7.289481607824001e-08, "epoch": 19.020609919571047, "percentage": 95.1, "elapsed_time": "4:28:35", "remaining_time": "0:13:49", "throughput": 4083.15, "total_tokens": 65803160} +{"current_steps": 113520, "total_steps": 119360, "loss": 0.4116, "lr": 7.277048083706384e-08, "epoch": 19.021447721179623, "percentage": 95.11, "elapsed_time": "4:28:36", "remaining_time": "0:13:49", "throughput": 4083.16, "total_tokens": 65806328} +{"current_steps": 113525, "total_steps": 119360, "loss": 0.1689, "lr": 7.264625094719035e-08, "epoch": 19.022285522788202, "percentage": 95.11, "elapsed_time": "4:28:37", "remaining_time": "0:13:48", "throughput": 4083.17, "total_tokens": 65809624} +{"current_steps": 113530, "total_steps": 119360, "loss": 0.4323, "lr": 7.252212641127465e-08, "epoch": 19.02312332439678, "percentage": 95.12, "elapsed_time": "4:28:37", "remaining_time": "0:13:47", "throughput": 4083.18, "total_tokens": 65812472} +{"current_steps": 113535, "total_steps": 119360, "loss": 0.4337, "lr": 7.239810723197128e-08, "epoch": 19.02396112600536, "percentage": 95.12, "elapsed_time": "4:28:38", "remaining_time": "0:13:46", "throughput": 4083.19, "total_tokens": 65815224} +{"current_steps": 113540, "total_steps": 119360, "loss": 0.2381, "lr": 7.227419341193142e-08, "epoch": 19.02479892761394, "percentage": 95.12, "elapsed_time": "4:28:39", "remaining_time": "0:13:46", "throughput": 4083.19, "total_tokens": 65818104} +{"current_steps": 113545, "total_steps": 119360, "loss": 0.257, "lr": 7.215038495380466e-08, "epoch": 19.02563672922252, "percentage": 95.13, "elapsed_time": "4:28:39", "remaining_time": "0:13:45", "throughput": 4083.2, "total_tokens": 65820984} +{"current_steps": 113550, "total_steps": 119360, "loss": 0.2625, "lr": 7.202668186023942e-08, "epoch": 19.0264745308311, "percentage": 95.13, "elapsed_time": "4:28:40", "remaining_time": "0:13:44", "throughput": 4083.21, "total_tokens": 65823832} +{"current_steps": 113555, "total_steps": 119360, "loss": 0.3991, "lr": 7.190308413387859e-08, "epoch": 19.027312332439678, "percentage": 95.14, "elapsed_time": "4:28:41", "remaining_time": "0:13:44", "throughput": 4083.22, "total_tokens": 65826872} +{"current_steps": 113560, "total_steps": 119360, "loss": 0.2191, "lr": 7.177959177736671e-08, "epoch": 19.028150134048257, "percentage": 95.14, "elapsed_time": "4:28:41", "remaining_time": "0:13:43", "throughput": 4083.23, "total_tokens": 65829560} +{"current_steps": 113565, "total_steps": 119360, "loss": 0.4277, "lr": 7.165620479334279e-08, "epoch": 19.028987935656836, "percentage": 95.14, "elapsed_time": "4:28:42", "remaining_time": "0:13:42", "throughput": 4083.23, "total_tokens": 65832472} +{"current_steps": 113570, "total_steps": 119360, "loss": 0.2411, "lr": 7.153292318444583e-08, "epoch": 19.029825737265416, "percentage": 95.15, "elapsed_time": "4:28:43", "remaining_time": "0:13:41", "throughput": 4083.23, "total_tokens": 65835000} +{"current_steps": 113575, "total_steps": 119360, "loss": 0.2238, "lr": 7.140974695331204e-08, "epoch": 19.030663538873995, "percentage": 95.15, "elapsed_time": "4:28:43", "remaining_time": "0:13:41", "throughput": 4083.25, "total_tokens": 65838232} +{"current_steps": 113580, "total_steps": 119360, "loss": 0.5316, "lr": 7.128667610257434e-08, "epoch": 19.031501340482574, "percentage": 95.16, "elapsed_time": "4:28:44", "remaining_time": "0:13:40", "throughput": 4083.26, "total_tokens": 65841400} +{"current_steps": 113585, "total_steps": 119360, "loss": 0.3778, "lr": 7.116371063486449e-08, "epoch": 19.032339142091153, "percentage": 95.16, "elapsed_time": "4:28:45", "remaining_time": "0:13:39", "throughput": 4083.27, "total_tokens": 65844344} +{"current_steps": 113590, "total_steps": 119360, "loss": 0.3036, "lr": 7.104085055281152e-08, "epoch": 19.033176943699733, "percentage": 95.17, "elapsed_time": "4:28:46", "remaining_time": "0:13:39", "throughput": 4083.28, "total_tokens": 65847288} +{"current_steps": 113595, "total_steps": 119360, "loss": 0.2653, "lr": 7.091809585904275e-08, "epoch": 19.034014745308312, "percentage": 95.17, "elapsed_time": "4:28:46", "remaining_time": "0:13:38", "throughput": 4083.28, "total_tokens": 65849976} +{"current_steps": 113600, "total_steps": 119360, "loss": 0.2892, "lr": 7.079544655618275e-08, "epoch": 19.03485254691689, "percentage": 95.17, "elapsed_time": "4:28:47", "remaining_time": "0:13:37", "throughput": 4083.3, "total_tokens": 65853048} +{"current_steps": 113605, "total_steps": 119360, "loss": 0.4601, "lr": 7.067290264685334e-08, "epoch": 19.03569034852547, "percentage": 95.18, "elapsed_time": "4:28:48", "remaining_time": "0:13:37", "throughput": 4083.3, "total_tokens": 65855736} +{"current_steps": 113610, "total_steps": 119360, "loss": 0.4956, "lr": 7.055046413367572e-08, "epoch": 19.03652815013405, "percentage": 95.18, "elapsed_time": "4:28:48", "remaining_time": "0:13:36", "throughput": 4083.32, "total_tokens": 65859000} +{"current_steps": 113615, "total_steps": 119360, "loss": 0.3335, "lr": 7.042813101926672e-08, "epoch": 19.03736595174263, "percentage": 95.19, "elapsed_time": "4:28:49", "remaining_time": "0:13:35", "throughput": 4083.32, "total_tokens": 65861752} +{"current_steps": 113620, "total_steps": 119360, "loss": 0.2606, "lr": 7.030590330624254e-08, "epoch": 19.038203753351205, "percentage": 95.19, "elapsed_time": "4:28:50", "remaining_time": "0:13:34", "throughput": 4083.33, "total_tokens": 65864504} +{"current_steps": 113625, "total_steps": 119360, "loss": 0.505, "lr": 7.018378099721723e-08, "epoch": 19.039041554959784, "percentage": 95.2, "elapsed_time": "4:28:50", "remaining_time": "0:13:34", "throughput": 4083.33, "total_tokens": 65867320} +{"current_steps": 113630, "total_steps": 119360, "loss": 0.2716, "lr": 7.006176409480036e-08, "epoch": 19.039879356568363, "percentage": 95.2, "elapsed_time": "4:28:51", "remaining_time": "0:13:33", "throughput": 4083.34, "total_tokens": 65870008} +{"current_steps": 113635, "total_steps": 119360, "loss": 0.2925, "lr": 6.993985260160208e-08, "epoch": 19.040717158176943, "percentage": 95.2, "elapsed_time": "4:28:52", "remaining_time": "0:13:32", "throughput": 4083.34, "total_tokens": 65872952} +{"current_steps": 113640, "total_steps": 119360, "loss": 0.0878, "lr": 6.981804652022917e-08, "epoch": 19.041554959785522, "percentage": 95.21, "elapsed_time": "4:28:52", "remaining_time": "0:13:32", "throughput": 4083.35, "total_tokens": 65875832} +{"current_steps": 113645, "total_steps": 119360, "loss": 0.2285, "lr": 6.969634585328511e-08, "epoch": 19.0423927613941, "percentage": 95.21, "elapsed_time": "4:28:53", "remaining_time": "0:13:31", "throughput": 4083.37, "total_tokens": 65879128} +{"current_steps": 113650, "total_steps": 119360, "loss": 0.3965, "lr": 6.957475060337171e-08, "epoch": 19.04323056300268, "percentage": 95.22, "elapsed_time": "4:28:54", "remaining_time": "0:13:30", "throughput": 4083.37, "total_tokens": 65881944} +{"current_steps": 113655, "total_steps": 119360, "loss": 0.2876, "lr": 6.945326077309078e-08, "epoch": 19.04406836461126, "percentage": 95.22, "elapsed_time": "4:28:54", "remaining_time": "0:13:29", "throughput": 4083.39, "total_tokens": 65884920} +{"current_steps": 113660, "total_steps": 119360, "loss": 0.2739, "lr": 6.933187636503858e-08, "epoch": 19.04490616621984, "percentage": 95.22, "elapsed_time": "4:28:55", "remaining_time": "0:13:29", "throughput": 4083.4, "total_tokens": 65887864} +{"current_steps": 113665, "total_steps": 119360, "loss": 0.2733, "lr": 6.921059738181024e-08, "epoch": 19.045743967828418, "percentage": 95.23, "elapsed_time": "4:28:56", "remaining_time": "0:13:28", "throughput": 4083.41, "total_tokens": 65891032} +{"current_steps": 113670, "total_steps": 119360, "loss": 0.4367, "lr": 6.908942382599981e-08, "epoch": 19.046581769436997, "percentage": 95.23, "elapsed_time": "4:28:56", "remaining_time": "0:13:27", "throughput": 4083.42, "total_tokens": 65893976} +{"current_steps": 113675, "total_steps": 119360, "loss": 0.4568, "lr": 6.896835570019745e-08, "epoch": 19.047419571045577, "percentage": 95.24, "elapsed_time": "4:28:57", "remaining_time": "0:13:27", "throughput": 4083.42, "total_tokens": 65896728} +{"current_steps": 113680, "total_steps": 119360, "loss": 0.3711, "lr": 6.884739300699161e-08, "epoch": 19.048257372654156, "percentage": 95.24, "elapsed_time": "4:28:58", "remaining_time": "0:13:26", "throughput": 4083.44, "total_tokens": 65899736} +{"current_steps": 113685, "total_steps": 119360, "loss": 0.3889, "lr": 6.87265357489697e-08, "epoch": 19.049095174262735, "percentage": 95.25, "elapsed_time": "4:28:58", "remaining_time": "0:13:25", "throughput": 4083.44, "total_tokens": 65902616} +{"current_steps": 113690, "total_steps": 119360, "loss": 0.4396, "lr": 6.860578392871464e-08, "epoch": 19.049932975871315, "percentage": 95.25, "elapsed_time": "4:28:59", "remaining_time": "0:13:24", "throughput": 4083.45, "total_tokens": 65905368} +{"current_steps": 113695, "total_steps": 119360, "loss": 0.1873, "lr": 6.848513754880881e-08, "epoch": 19.050770777479894, "percentage": 95.25, "elapsed_time": "4:29:00", "remaining_time": "0:13:24", "throughput": 4083.46, "total_tokens": 65908696} +{"current_steps": 113700, "total_steps": 119360, "loss": 0.2225, "lr": 6.836459661183237e-08, "epoch": 19.051608579088473, "percentage": 95.26, "elapsed_time": "4:29:01", "remaining_time": "0:13:23", "throughput": 4083.47, "total_tokens": 65911608} +{"current_steps": 113705, "total_steps": 119360, "loss": 0.3362, "lr": 6.824416112036158e-08, "epoch": 19.052446380697052, "percentage": 95.26, "elapsed_time": "4:29:01", "remaining_time": "0:13:22", "throughput": 4083.48, "total_tokens": 65914584} +{"current_steps": 113710, "total_steps": 119360, "loss": 0.2961, "lr": 6.812383107697218e-08, "epoch": 19.05328418230563, "percentage": 95.27, "elapsed_time": "4:29:02", "remaining_time": "0:13:22", "throughput": 4083.49, "total_tokens": 65917336} +{"current_steps": 113715, "total_steps": 119360, "loss": 0.3063, "lr": 6.80036064842371e-08, "epoch": 19.05412198391421, "percentage": 95.27, "elapsed_time": "4:29:03", "remaining_time": "0:13:21", "throughput": 4083.49, "total_tokens": 65920120} +{"current_steps": 113720, "total_steps": 119360, "loss": 0.4336, "lr": 6.788348734472594e-08, "epoch": 19.054959785522787, "percentage": 95.27, "elapsed_time": "4:29:03", "remaining_time": "0:13:20", "throughput": 4083.5, "total_tokens": 65922968} +{"current_steps": 113725, "total_steps": 119360, "loss": 0.2085, "lr": 6.776347366100833e-08, "epoch": 19.055797587131366, "percentage": 95.28, "elapsed_time": "4:29:04", "remaining_time": "0:13:19", "throughput": 4083.51, "total_tokens": 65925720} +{"current_steps": 113730, "total_steps": 119360, "loss": 0.2563, "lr": 6.764356543564943e-08, "epoch": 19.056635388739945, "percentage": 95.28, "elapsed_time": "4:29:05", "remaining_time": "0:13:19", "throughput": 4083.52, "total_tokens": 65928504} +{"current_steps": 113735, "total_steps": 119360, "loss": 0.2851, "lr": 6.75237626712133e-08, "epoch": 19.057473190348524, "percentage": 95.29, "elapsed_time": "4:29:05", "remaining_time": "0:13:18", "throughput": 4083.53, "total_tokens": 65931320} +{"current_steps": 113740, "total_steps": 119360, "loss": 0.2611, "lr": 6.740406537026179e-08, "epoch": 19.058310991957104, "percentage": 95.29, "elapsed_time": "4:29:06", "remaining_time": "0:13:17", "throughput": 4083.54, "total_tokens": 65934200} +{"current_steps": 113745, "total_steps": 119360, "loss": 0.5895, "lr": 6.72844735353545e-08, "epoch": 19.059148793565683, "percentage": 95.3, "elapsed_time": "4:29:07", "remaining_time": "0:13:17", "throughput": 4083.55, "total_tokens": 65937272} +{"current_steps": 113750, "total_steps": 119360, "loss": 0.5144, "lr": 6.716498716904718e-08, "epoch": 19.059986595174262, "percentage": 95.3, "elapsed_time": "4:29:07", "remaining_time": "0:13:16", "throughput": 4083.56, "total_tokens": 65940088} +{"current_steps": 113755, "total_steps": 119360, "loss": 0.3255, "lr": 6.704560627389556e-08, "epoch": 19.06082439678284, "percentage": 95.3, "elapsed_time": "4:29:08", "remaining_time": "0:13:15", "throughput": 4083.57, "total_tokens": 65942968} +{"current_steps": 113760, "total_steps": 119360, "loss": 0.4587, "lr": 6.692633085245203e-08, "epoch": 19.06166219839142, "percentage": 95.31, "elapsed_time": "4:29:09", "remaining_time": "0:13:14", "throughput": 4083.57, "total_tokens": 65945688} +{"current_steps": 113765, "total_steps": 119360, "loss": 0.4121, "lr": 6.68071609072668e-08, "epoch": 19.0625, "percentage": 95.31, "elapsed_time": "4:29:09", "remaining_time": "0:13:14", "throughput": 4083.58, "total_tokens": 65948696} +{"current_steps": 113770, "total_steps": 119360, "loss": 0.3931, "lr": 6.668809644088781e-08, "epoch": 19.06333780160858, "percentage": 95.32, "elapsed_time": "4:29:10", "remaining_time": "0:13:13", "throughput": 4083.6, "total_tokens": 65951736} +{"current_steps": 113775, "total_steps": 119360, "loss": 0.4008, "lr": 6.656913745586135e-08, "epoch": 19.06417560321716, "percentage": 95.32, "elapsed_time": "4:29:11", "remaining_time": "0:13:12", "throughput": 4083.6, "total_tokens": 65954328} +{"current_steps": 113780, "total_steps": 119360, "loss": 0.3746, "lr": 6.64502839547304e-08, "epoch": 19.065013404825738, "percentage": 95.33, "elapsed_time": "4:29:11", "remaining_time": "0:13:12", "throughput": 4083.61, "total_tokens": 65957400} +{"current_steps": 113785, "total_steps": 119360, "loss": 0.4165, "lr": 6.633153594003627e-08, "epoch": 19.065851206434317, "percentage": 95.33, "elapsed_time": "4:29:12", "remaining_time": "0:13:11", "throughput": 4083.63, "total_tokens": 65960440} +{"current_steps": 113790, "total_steps": 119360, "loss": 0.3137, "lr": 6.621289341431858e-08, "epoch": 19.066689008042896, "percentage": 95.33, "elapsed_time": "4:29:13", "remaining_time": "0:13:10", "throughput": 4083.63, "total_tokens": 65963096} +{"current_steps": 113795, "total_steps": 119360, "loss": 0.4645, "lr": 6.609435638011252e-08, "epoch": 19.067526809651476, "percentage": 95.34, "elapsed_time": "4:29:13", "remaining_time": "0:13:09", "throughput": 4083.64, "total_tokens": 65965752} +{"current_steps": 113800, "total_steps": 119360, "loss": 0.2361, "lr": 6.597592483995441e-08, "epoch": 19.068364611260055, "percentage": 95.34, "elapsed_time": "4:29:14", "remaining_time": "0:13:09", "throughput": 4083.65, "total_tokens": 65968824} +{"current_steps": 113805, "total_steps": 119360, "loss": 0.396, "lr": 6.585759879637609e-08, "epoch": 19.069202412868634, "percentage": 95.35, "elapsed_time": "4:29:15", "remaining_time": "0:13:08", "throughput": 4083.66, "total_tokens": 65972088} +{"current_steps": 113810, "total_steps": 119360, "loss": 0.3362, "lr": 6.573937825190613e-08, "epoch": 19.070040214477213, "percentage": 95.35, "elapsed_time": "4:29:15", "remaining_time": "0:13:07", "throughput": 4083.67, "total_tokens": 65974712} +{"current_steps": 113815, "total_steps": 119360, "loss": 0.2571, "lr": 6.562126320907358e-08, "epoch": 19.07087801608579, "percentage": 95.35, "elapsed_time": "4:29:16", "remaining_time": "0:13:07", "throughput": 4083.68, "total_tokens": 65977688} +{"current_steps": 113820, "total_steps": 119360, "loss": 0.5937, "lr": 6.550325367040422e-08, "epoch": 19.07171581769437, "percentage": 95.36, "elapsed_time": "4:29:17", "remaining_time": "0:13:06", "throughput": 4083.68, "total_tokens": 65980536} +{"current_steps": 113825, "total_steps": 119360, "loss": 0.2316, "lr": 6.538534963841991e-08, "epoch": 19.072553619302948, "percentage": 95.36, "elapsed_time": "4:29:17", "remaining_time": "0:13:05", "throughput": 4083.69, "total_tokens": 65983544} +{"current_steps": 113830, "total_steps": 119360, "loss": 0.2658, "lr": 6.526755111564309e-08, "epoch": 19.073391420911527, "percentage": 95.37, "elapsed_time": "4:29:18", "remaining_time": "0:13:04", "throughput": 4083.7, "total_tokens": 65986168} +{"current_steps": 113835, "total_steps": 119360, "loss": 0.3715, "lr": 6.514985810459118e-08, "epoch": 19.074229222520106, "percentage": 95.37, "elapsed_time": "4:29:19", "remaining_time": "0:13:04", "throughput": 4083.71, "total_tokens": 65989112} +{"current_steps": 113840, "total_steps": 119360, "loss": 0.2286, "lr": 6.503227060778105e-08, "epoch": 19.075067024128685, "percentage": 95.38, "elapsed_time": "4:29:19", "remaining_time": "0:13:03", "throughput": 4083.71, "total_tokens": 65991832} +{"current_steps": 113845, "total_steps": 119360, "loss": 0.217, "lr": 6.491478862772738e-08, "epoch": 19.075904825737265, "percentage": 95.38, "elapsed_time": "4:29:20", "remaining_time": "0:13:02", "throughput": 4083.72, "total_tokens": 65995000} +{"current_steps": 113850, "total_steps": 119360, "loss": 0.1392, "lr": 6.479741216694202e-08, "epoch": 19.076742627345844, "percentage": 95.38, "elapsed_time": "4:29:21", "remaining_time": "0:13:02", "throughput": 4083.74, "total_tokens": 65997912} +{"current_steps": 113855, "total_steps": 119360, "loss": 0.3722, "lr": 6.468014122793354e-08, "epoch": 19.077580428954423, "percentage": 95.39, "elapsed_time": "4:29:21", "remaining_time": "0:13:01", "throughput": 4083.75, "total_tokens": 66000856} +{"current_steps": 113860, "total_steps": 119360, "loss": 0.3904, "lr": 6.456297581321102e-08, "epoch": 19.078418230563003, "percentage": 95.39, "elapsed_time": "4:29:22", "remaining_time": "0:13:00", "throughput": 4083.76, "total_tokens": 66003800} +{"current_steps": 113865, "total_steps": 119360, "loss": 0.1814, "lr": 6.44459159252786e-08, "epoch": 19.079256032171582, "percentage": 95.4, "elapsed_time": "4:29:23", "remaining_time": "0:13:00", "throughput": 4083.78, "total_tokens": 66006904} +{"current_steps": 113870, "total_steps": 119360, "loss": 0.6007, "lr": 6.432896156663926e-08, "epoch": 19.08009383378016, "percentage": 95.4, "elapsed_time": "4:29:23", "remaining_time": "0:12:59", "throughput": 4083.78, "total_tokens": 66009752} +{"current_steps": 113875, "total_steps": 119360, "loss": 0.2038, "lr": 6.421211273979322e-08, "epoch": 19.08093163538874, "percentage": 95.4, "elapsed_time": "4:29:24", "remaining_time": "0:12:58", "throughput": 4083.79, "total_tokens": 66012504} +{"current_steps": 113880, "total_steps": 119360, "loss": 0.2396, "lr": 6.409536944724071e-08, "epoch": 19.08176943699732, "percentage": 95.41, "elapsed_time": "4:29:25", "remaining_time": "0:12:57", "throughput": 4083.79, "total_tokens": 66015288} +{"current_steps": 113885, "total_steps": 119360, "loss": 0.4457, "lr": 6.397873169147583e-08, "epoch": 19.0826072386059, "percentage": 95.41, "elapsed_time": "4:29:25", "remaining_time": "0:12:57", "throughput": 4083.8, "total_tokens": 66018040} +{"current_steps": 113890, "total_steps": 119360, "loss": 0.4168, "lr": 6.386219947499329e-08, "epoch": 19.083445040214478, "percentage": 95.42, "elapsed_time": "4:29:26", "remaining_time": "0:12:56", "throughput": 4083.81, "total_tokens": 66020792} +{"current_steps": 113895, "total_steps": 119360, "loss": 0.2187, "lr": 6.374577280028438e-08, "epoch": 19.084282841823057, "percentage": 95.42, "elapsed_time": "4:29:27", "remaining_time": "0:12:55", "throughput": 4083.82, "total_tokens": 66023960} +{"current_steps": 113900, "total_steps": 119360, "loss": 0.2869, "lr": 6.362945166983936e-08, "epoch": 19.085120643431637, "percentage": 95.43, "elapsed_time": "4:29:27", "remaining_time": "0:12:55", "throughput": 4083.84, "total_tokens": 66027032} +{"current_steps": 113905, "total_steps": 119360, "loss": 0.2129, "lr": 6.351323608614401e-08, "epoch": 19.085958445040216, "percentage": 95.43, "elapsed_time": "4:29:28", "remaining_time": "0:12:54", "throughput": 4083.84, "total_tokens": 66029912} +{"current_steps": 113910, "total_steps": 119360, "loss": 0.4962, "lr": 6.339712605168468e-08, "epoch": 19.086796246648795, "percentage": 95.43, "elapsed_time": "4:29:29", "remaining_time": "0:12:53", "throughput": 4083.85, "total_tokens": 66032760} +{"current_steps": 113915, "total_steps": 119360, "loss": 0.258, "lr": 6.328112156894272e-08, "epoch": 19.08763404825737, "percentage": 95.44, "elapsed_time": "4:29:29", "remaining_time": "0:12:52", "throughput": 4083.86, "total_tokens": 66035544} +{"current_steps": 113920, "total_steps": 119360, "loss": 0.252, "lr": 6.316522264039892e-08, "epoch": 19.08847184986595, "percentage": 95.44, "elapsed_time": "4:29:30", "remaining_time": "0:12:52", "throughput": 4083.87, "total_tokens": 66038712} +{"current_steps": 113925, "total_steps": 119360, "loss": 0.2937, "lr": 6.304942926853186e-08, "epoch": 19.08930965147453, "percentage": 95.45, "elapsed_time": "4:29:31", "remaining_time": "0:12:51", "throughput": 4083.88, "total_tokens": 66041400} +{"current_steps": 113930, "total_steps": 119360, "loss": 0.4232, "lr": 6.293374145581676e-08, "epoch": 19.09014745308311, "percentage": 95.45, "elapsed_time": "4:29:31", "remaining_time": "0:12:50", "throughput": 4083.88, "total_tokens": 66044152} +{"current_steps": 113935, "total_steps": 119360, "loss": 0.337, "lr": 6.281815920472722e-08, "epoch": 19.090985254691688, "percentage": 95.45, "elapsed_time": "4:29:32", "remaining_time": "0:12:50", "throughput": 4083.89, "total_tokens": 66046936} +{"current_steps": 113940, "total_steps": 119360, "loss": 0.4627, "lr": 6.27026825177346e-08, "epoch": 19.091823056300267, "percentage": 95.46, "elapsed_time": "4:29:33", "remaining_time": "0:12:49", "throughput": 4083.9, "total_tokens": 66049848} +{"current_steps": 113945, "total_steps": 119360, "loss": 0.2347, "lr": 6.258731139730855e-08, "epoch": 19.092660857908847, "percentage": 95.46, "elapsed_time": "4:29:33", "remaining_time": "0:12:48", "throughput": 4083.91, "total_tokens": 66052792} +{"current_steps": 113950, "total_steps": 119360, "loss": 0.328, "lr": 6.247204584591493e-08, "epoch": 19.093498659517426, "percentage": 95.47, "elapsed_time": "4:29:34", "remaining_time": "0:12:47", "throughput": 4083.91, "total_tokens": 66055320} +{"current_steps": 113955, "total_steps": 119360, "loss": 0.4561, "lr": 6.23568858660184e-08, "epoch": 19.094336461126005, "percentage": 95.47, "elapsed_time": "4:29:35", "remaining_time": "0:12:47", "throughput": 4083.92, "total_tokens": 66058360} +{"current_steps": 113960, "total_steps": 119360, "loss": 0.3679, "lr": 6.2241831460082e-08, "epoch": 19.095174262734584, "percentage": 95.48, "elapsed_time": "4:29:35", "remaining_time": "0:12:46", "throughput": 4083.93, "total_tokens": 66061400} +{"current_steps": 113965, "total_steps": 119360, "loss": 0.4844, "lr": 6.212688263056544e-08, "epoch": 19.096012064343164, "percentage": 95.48, "elapsed_time": "4:29:36", "remaining_time": "0:12:45", "throughput": 4083.95, "total_tokens": 66064600} +{"current_steps": 113970, "total_steps": 119360, "loss": 0.2471, "lr": 6.201203937992672e-08, "epoch": 19.096849865951743, "percentage": 95.48, "elapsed_time": "4:29:37", "remaining_time": "0:12:45", "throughput": 4083.96, "total_tokens": 66067672} +{"current_steps": 113975, "total_steps": 119360, "loss": 0.1801, "lr": 6.189730171062059e-08, "epoch": 19.097687667560322, "percentage": 95.49, "elapsed_time": "4:29:38", "remaining_time": "0:12:44", "throughput": 4083.97, "total_tokens": 66070520} +{"current_steps": 113980, "total_steps": 119360, "loss": 0.4564, "lr": 6.178266962510004e-08, "epoch": 19.0985254691689, "percentage": 95.49, "elapsed_time": "4:29:38", "remaining_time": "0:12:43", "throughput": 4083.98, "total_tokens": 66073496} +{"current_steps": 113985, "total_steps": 119360, "loss": 0.4226, "lr": 6.16681431258176e-08, "epoch": 19.09936327077748, "percentage": 95.5, "elapsed_time": "4:29:39", "remaining_time": "0:12:42", "throughput": 4084.0, "total_tokens": 66076536} +{"current_steps": 113990, "total_steps": 119360, "loss": 0.2211, "lr": 6.155372221522127e-08, "epoch": 19.10020107238606, "percentage": 95.5, "elapsed_time": "4:29:40", "remaining_time": "0:12:42", "throughput": 4084.01, "total_tokens": 66079512} +{"current_steps": 113995, "total_steps": 119360, "loss": 0.6173, "lr": 6.143940689575689e-08, "epoch": 19.10103887399464, "percentage": 95.51, "elapsed_time": "4:29:40", "remaining_time": "0:12:41", "throughput": 4084.01, "total_tokens": 66082200} +{"current_steps": 114000, "total_steps": 119360, "loss": 0.3978, "lr": 6.132519716986973e-08, "epoch": 19.10187667560322, "percentage": 95.51, "elapsed_time": "4:29:41", "remaining_time": "0:12:40", "throughput": 4084.02, "total_tokens": 66085112} +{"current_steps": 114005, "total_steps": 119360, "loss": 0.0541, "lr": 6.121109304000061e-08, "epoch": 19.102714477211798, "percentage": 95.51, "elapsed_time": "4:29:42", "remaining_time": "0:12:40", "throughput": 4084.03, "total_tokens": 66087896} +{"current_steps": 114010, "total_steps": 119360, "loss": 0.2904, "lr": 6.109709450859036e-08, "epoch": 19.103552278820377, "percentage": 95.52, "elapsed_time": "4:29:42", "remaining_time": "0:12:39", "throughput": 4084.03, "total_tokens": 66090648} +{"current_steps": 114015, "total_steps": 119360, "loss": 0.4259, "lr": 6.098320157807647e-08, "epoch": 19.104390080428953, "percentage": 95.52, "elapsed_time": "4:29:43", "remaining_time": "0:12:38", "throughput": 4084.03, "total_tokens": 66093304} +{"current_steps": 114020, "total_steps": 119360, "loss": 0.3261, "lr": 6.086941425089254e-08, "epoch": 19.105227882037532, "percentage": 95.53, "elapsed_time": "4:29:44", "remaining_time": "0:12:37", "throughput": 4084.04, "total_tokens": 66096152} +{"current_steps": 114025, "total_steps": 119360, "loss": 0.3247, "lr": 6.07557325294733e-08, "epoch": 19.10606568364611, "percentage": 95.53, "elapsed_time": "4:29:44", "remaining_time": "0:12:37", "throughput": 4084.06, "total_tokens": 66099192} +{"current_steps": 114030, "total_steps": 119360, "loss": 0.1902, "lr": 6.064215641624904e-08, "epoch": 19.10690348525469, "percentage": 95.53, "elapsed_time": "4:29:45", "remaining_time": "0:12:36", "throughput": 4084.07, "total_tokens": 66102296} +{"current_steps": 114035, "total_steps": 119360, "loss": 0.3945, "lr": 6.052868591364724e-08, "epoch": 19.10774128686327, "percentage": 95.54, "elapsed_time": "4:29:46", "remaining_time": "0:12:35", "throughput": 4084.08, "total_tokens": 66105144} +{"current_steps": 114040, "total_steps": 119360, "loss": 0.2199, "lr": 6.041532102409486e-08, "epoch": 19.10857908847185, "percentage": 95.54, "elapsed_time": "4:29:46", "remaining_time": "0:12:35", "throughput": 4084.08, "total_tokens": 66107832} +{"current_steps": 114045, "total_steps": 119360, "loss": 0.4478, "lr": 6.030206175001607e-08, "epoch": 19.10941689008043, "percentage": 95.55, "elapsed_time": "4:29:47", "remaining_time": "0:12:34", "throughput": 4084.08, "total_tokens": 66110392} +{"current_steps": 114050, "total_steps": 119360, "loss": 0.1106, "lr": 6.018890809383171e-08, "epoch": 19.110254691689008, "percentage": 95.55, "elapsed_time": "4:29:47", "remaining_time": "0:12:33", "throughput": 4084.09, "total_tokens": 66113208} +{"current_steps": 114055, "total_steps": 119360, "loss": 0.6019, "lr": 6.007586005796151e-08, "epoch": 19.111092493297587, "percentage": 95.56, "elapsed_time": "4:29:48", "remaining_time": "0:12:32", "throughput": 4084.1, "total_tokens": 66116216} +{"current_steps": 114060, "total_steps": 119360, "loss": 0.5043, "lr": 5.996291764482242e-08, "epoch": 19.111930294906166, "percentage": 95.56, "elapsed_time": "4:29:49", "remaining_time": "0:12:32", "throughput": 4084.11, "total_tokens": 66119032} +{"current_steps": 114065, "total_steps": 119360, "loss": 0.4738, "lr": 5.985008085683031e-08, "epoch": 19.112768096514746, "percentage": 95.56, "elapsed_time": "4:29:50", "remaining_time": "0:12:31", "throughput": 4084.12, "total_tokens": 66122008} +{"current_steps": 114070, "total_steps": 119360, "loss": 0.2256, "lr": 5.9737349696396e-08, "epoch": 19.113605898123325, "percentage": 95.57, "elapsed_time": "4:29:50", "remaining_time": "0:12:30", "throughput": 4084.13, "total_tokens": 66124824} +{"current_steps": 114075, "total_steps": 119360, "loss": 0.7128, "lr": 5.962472416593202e-08, "epoch": 19.114443699731904, "percentage": 95.57, "elapsed_time": "4:29:51", "remaining_time": "0:12:30", "throughput": 4084.14, "total_tokens": 66127704} +{"current_steps": 114080, "total_steps": 119360, "loss": 0.3006, "lr": 5.951220426784421e-08, "epoch": 19.115281501340483, "percentage": 95.58, "elapsed_time": "4:29:52", "remaining_time": "0:12:29", "throughput": 4084.15, "total_tokens": 66130840} +{"current_steps": 114085, "total_steps": 119360, "loss": 0.3885, "lr": 5.9399790004540105e-08, "epoch": 19.116119302949063, "percentage": 95.58, "elapsed_time": "4:29:52", "remaining_time": "0:12:28", "throughput": 4084.17, "total_tokens": 66133944} +{"current_steps": 114090, "total_steps": 119360, "loss": 0.2593, "lr": 5.9287481378422773e-08, "epoch": 19.116957104557642, "percentage": 95.58, "elapsed_time": "4:29:53", "remaining_time": "0:12:27", "throughput": 4084.18, "total_tokens": 66136696} +{"current_steps": 114095, "total_steps": 119360, "loss": 0.2847, "lr": 5.917527839189363e-08, "epoch": 19.11779490616622, "percentage": 95.59, "elapsed_time": "4:29:54", "remaining_time": "0:12:27", "throughput": 4084.19, "total_tokens": 66139672} +{"current_steps": 114100, "total_steps": 119360, "loss": 0.1538, "lr": 5.906318104735076e-08, "epoch": 19.1186327077748, "percentage": 95.59, "elapsed_time": "4:29:54", "remaining_time": "0:12:26", "throughput": 4084.19, "total_tokens": 66142392} +{"current_steps": 114105, "total_steps": 119360, "loss": 0.1619, "lr": 5.895118934719224e-08, "epoch": 19.11947050938338, "percentage": 95.6, "elapsed_time": "4:29:55", "remaining_time": "0:12:25", "throughput": 4084.2, "total_tokens": 66145400} +{"current_steps": 114110, "total_steps": 119360, "loss": 0.1832, "lr": 5.8839303293812266e-08, "epoch": 19.120308310991955, "percentage": 95.6, "elapsed_time": "4:29:56", "remaining_time": "0:12:25", "throughput": 4084.21, "total_tokens": 66148152} +{"current_steps": 114115, "total_steps": 119360, "loss": 0.2818, "lr": 5.872752288960282e-08, "epoch": 19.121146112600535, "percentage": 95.61, "elapsed_time": "4:29:56", "remaining_time": "0:12:24", "throughput": 4084.23, "total_tokens": 66151224} +{"current_steps": 114120, "total_steps": 119360, "loss": 0.2469, "lr": 5.86158481369542e-08, "epoch": 19.121983914209114, "percentage": 95.61, "elapsed_time": "4:29:57", "remaining_time": "0:12:23", "throughput": 4084.23, "total_tokens": 66154040} +{"current_steps": 114125, "total_steps": 119360, "loss": 0.2635, "lr": 5.850427903825395e-08, "epoch": 19.122821715817693, "percentage": 95.61, "elapsed_time": "4:29:58", "remaining_time": "0:12:23", "throughput": 4084.23, "total_tokens": 66156824} +{"current_steps": 114130, "total_steps": 119360, "loss": 0.3321, "lr": 5.839281559588794e-08, "epoch": 19.123659517426272, "percentage": 95.62, "elapsed_time": "4:29:58", "remaining_time": "0:12:22", "throughput": 4084.24, "total_tokens": 66159736} +{"current_steps": 114135, "total_steps": 119360, "loss": 0.2578, "lr": 5.8281457812239263e-08, "epoch": 19.12449731903485, "percentage": 95.62, "elapsed_time": "4:29:59", "remaining_time": "0:12:21", "throughput": 4084.25, "total_tokens": 66162616} +{"current_steps": 114140, "total_steps": 119360, "loss": 0.4612, "lr": 5.817020568968879e-08, "epoch": 19.12533512064343, "percentage": 95.63, "elapsed_time": "4:30:00", "remaining_time": "0:12:20", "throughput": 4084.26, "total_tokens": 66165528} +{"current_steps": 114145, "total_steps": 119360, "loss": 0.4333, "lr": 5.805905923061461e-08, "epoch": 19.12617292225201, "percentage": 95.63, "elapsed_time": "4:30:00", "remaining_time": "0:12:20", "throughput": 4084.27, "total_tokens": 66168312} +{"current_steps": 114150, "total_steps": 119360, "loss": 0.2616, "lr": 5.794801843739484e-08, "epoch": 19.12701072386059, "percentage": 95.64, "elapsed_time": "4:30:01", "remaining_time": "0:12:19", "throughput": 4084.28, "total_tokens": 66171064} +{"current_steps": 114155, "total_steps": 119360, "loss": 0.3327, "lr": 5.783708331240201e-08, "epoch": 19.12784852546917, "percentage": 95.64, "elapsed_time": "4:30:02", "remaining_time": "0:12:18", "throughput": 4084.29, "total_tokens": 66174040} +{"current_steps": 114160, "total_steps": 119360, "loss": 0.3921, "lr": 5.772625385800923e-08, "epoch": 19.128686327077748, "percentage": 95.64, "elapsed_time": "4:30:02", "remaining_time": "0:12:18", "throughput": 4084.29, "total_tokens": 66176888} +{"current_steps": 114165, "total_steps": 119360, "loss": 0.5472, "lr": 5.7615530076585715e-08, "epoch": 19.129524128686327, "percentage": 95.65, "elapsed_time": "4:30:03", "remaining_time": "0:12:17", "throughput": 4084.3, "total_tokens": 66179672} +{"current_steps": 114170, "total_steps": 119360, "loss": 0.331, "lr": 5.750491197049901e-08, "epoch": 19.130361930294907, "percentage": 95.65, "elapsed_time": "4:30:04", "remaining_time": "0:12:16", "throughput": 4084.3, "total_tokens": 66182392} +{"current_steps": 114175, "total_steps": 119360, "loss": 0.367, "lr": 5.73943995421139e-08, "epoch": 19.131199731903486, "percentage": 95.66, "elapsed_time": "4:30:04", "remaining_time": "0:12:15", "throughput": 4084.31, "total_tokens": 66185272} +{"current_steps": 114180, "total_steps": 119360, "loss": 0.4263, "lr": 5.7283992793794044e-08, "epoch": 19.132037533512065, "percentage": 95.66, "elapsed_time": "4:30:05", "remaining_time": "0:12:15", "throughput": 4084.32, "total_tokens": 66188088} +{"current_steps": 114185, "total_steps": 119360, "loss": 0.2238, "lr": 5.7173691727899216e-08, "epoch": 19.132875335120644, "percentage": 95.66, "elapsed_time": "4:30:06", "remaining_time": "0:12:14", "throughput": 4084.33, "total_tokens": 66190904} +{"current_steps": 114190, "total_steps": 119360, "loss": 0.3583, "lr": 5.706349634678865e-08, "epoch": 19.133713136729224, "percentage": 95.67, "elapsed_time": "4:30:06", "remaining_time": "0:12:13", "throughput": 4084.34, "total_tokens": 66193784} +{"current_steps": 114195, "total_steps": 119360, "loss": 0.2503, "lr": 5.6953406652818236e-08, "epoch": 19.134550938337803, "percentage": 95.67, "elapsed_time": "4:30:07", "remaining_time": "0:12:13", "throughput": 4084.35, "total_tokens": 66196952} +{"current_steps": 114200, "total_steps": 119360, "loss": 0.1987, "lr": 5.684342264834164e-08, "epoch": 19.135388739946382, "percentage": 95.68, "elapsed_time": "4:30:08", "remaining_time": "0:12:12", "throughput": 4084.36, "total_tokens": 66200216} +{"current_steps": 114205, "total_steps": 119360, "loss": 0.4665, "lr": 5.673354433571032e-08, "epoch": 19.13622654155496, "percentage": 95.68, "elapsed_time": "4:30:08", "remaining_time": "0:12:11", "throughput": 4084.37, "total_tokens": 66203096} +{"current_steps": 114210, "total_steps": 119360, "loss": 0.2828, "lr": 5.6623771717274065e-08, "epoch": 19.137064343163537, "percentage": 95.69, "elapsed_time": "4:30:09", "remaining_time": "0:12:10", "throughput": 4084.38, "total_tokens": 66206200} +{"current_steps": 114215, "total_steps": 119360, "loss": 0.406, "lr": 5.6514104795379885e-08, "epoch": 19.137902144772116, "percentage": 95.69, "elapsed_time": "4:30:10", "remaining_time": "0:12:10", "throughput": 4084.38, "total_tokens": 66209080} +{"current_steps": 114220, "total_steps": 119360, "loss": 0.4904, "lr": 5.640454357237257e-08, "epoch": 19.138739946380696, "percentage": 95.69, "elapsed_time": "4:30:10", "remaining_time": "0:12:09", "throughput": 4084.39, "total_tokens": 66211832} +{"current_steps": 114225, "total_steps": 119360, "loss": 0.6042, "lr": 5.6295088050594135e-08, "epoch": 19.139577747989275, "percentage": 95.7, "elapsed_time": "4:30:11", "remaining_time": "0:12:08", "throughput": 4084.41, "total_tokens": 66214808} +{"current_steps": 114230, "total_steps": 119360, "loss": 0.5192, "lr": 5.6185738232386044e-08, "epoch": 19.140415549597854, "percentage": 95.7, "elapsed_time": "4:30:12", "remaining_time": "0:12:08", "throughput": 4084.41, "total_tokens": 66217304} +{"current_steps": 114235, "total_steps": 119360, "loss": 0.3463, "lr": 5.6076494120085314e-08, "epoch": 19.141253351206434, "percentage": 95.71, "elapsed_time": "4:30:12", "remaining_time": "0:12:07", "throughput": 4084.41, "total_tokens": 66220184} +{"current_steps": 114240, "total_steps": 119360, "loss": 0.3533, "lr": 5.59673557160284e-08, "epoch": 19.142091152815013, "percentage": 95.71, "elapsed_time": "4:30:13", "remaining_time": "0:12:06", "throughput": 4084.42, "total_tokens": 66222904} +{"current_steps": 114245, "total_steps": 119360, "loss": 0.323, "lr": 5.585832302254846e-08, "epoch": 19.142928954423592, "percentage": 95.71, "elapsed_time": "4:30:14", "remaining_time": "0:12:05", "throughput": 4084.43, "total_tokens": 66225688} +{"current_steps": 114250, "total_steps": 119360, "loss": 0.2979, "lr": 5.5749396041976934e-08, "epoch": 19.14376675603217, "percentage": 95.72, "elapsed_time": "4:30:14", "remaining_time": "0:12:05", "throughput": 4084.44, "total_tokens": 66228568} +{"current_steps": 114255, "total_steps": 119360, "loss": 0.0952, "lr": 5.5640574776643085e-08, "epoch": 19.14460455764075, "percentage": 95.72, "elapsed_time": "4:30:15", "remaining_time": "0:12:04", "throughput": 4084.45, "total_tokens": 66231704} +{"current_steps": 114260, "total_steps": 119360, "loss": 0.153, "lr": 5.553185922887283e-08, "epoch": 19.14544235924933, "percentage": 95.73, "elapsed_time": "4:30:16", "remaining_time": "0:12:03", "throughput": 4084.47, "total_tokens": 66234808} +{"current_steps": 114265, "total_steps": 119360, "loss": 0.2346, "lr": 5.542324940099153e-08, "epoch": 19.14628016085791, "percentage": 95.73, "elapsed_time": "4:30:16", "remaining_time": "0:12:03", "throughput": 4084.48, "total_tokens": 66237912} +{"current_steps": 114270, "total_steps": 119360, "loss": 0.1974, "lr": 5.531474529532122e-08, "epoch": 19.14711796246649, "percentage": 95.74, "elapsed_time": "4:30:17", "remaining_time": "0:12:02", "throughput": 4084.48, "total_tokens": 66240632} +{"current_steps": 114275, "total_steps": 119360, "loss": 0.1624, "lr": 5.52063469141817e-08, "epoch": 19.147955764075068, "percentage": 95.74, "elapsed_time": "4:30:18", "remaining_time": "0:12:01", "throughput": 4084.49, "total_tokens": 66243736} +{"current_steps": 114280, "total_steps": 119360, "loss": 0.3127, "lr": 5.5098054259890565e-08, "epoch": 19.148793565683647, "percentage": 95.74, "elapsed_time": "4:30:19", "remaining_time": "0:12:00", "throughput": 4084.5, "total_tokens": 66246584} +{"current_steps": 114285, "total_steps": 119360, "loss": 0.2327, "lr": 5.498986733476319e-08, "epoch": 19.149631367292226, "percentage": 95.75, "elapsed_time": "4:30:19", "remaining_time": "0:12:00", "throughput": 4084.5, "total_tokens": 66249176} +{"current_steps": 114290, "total_steps": 119360, "loss": 0.3013, "lr": 5.4881786141113835e-08, "epoch": 19.150469168900806, "percentage": 95.75, "elapsed_time": "4:30:20", "remaining_time": "0:11:59", "throughput": 4084.51, "total_tokens": 66252184} +{"current_steps": 114295, "total_steps": 119360, "loss": 0.456, "lr": 5.477381068125232e-08, "epoch": 19.151306970509385, "percentage": 95.76, "elapsed_time": "4:30:21", "remaining_time": "0:11:58", "throughput": 4084.53, "total_tokens": 66255224} +{"current_steps": 114300, "total_steps": 119360, "loss": 0.1321, "lr": 5.46659409574879e-08, "epoch": 19.152144772117964, "percentage": 95.76, "elapsed_time": "4:30:21", "remaining_time": "0:11:58", "throughput": 4084.54, "total_tokens": 66258040} +{"current_steps": 114305, "total_steps": 119360, "loss": 0.3336, "lr": 5.455817697212595e-08, "epoch": 19.15298257372654, "percentage": 95.76, "elapsed_time": "4:30:22", "remaining_time": "0:11:57", "throughput": 4084.55, "total_tokens": 66261016} +{"current_steps": 114310, "total_steps": 119360, "loss": 0.347, "lr": 5.4450518727471865e-08, "epoch": 19.15382037533512, "percentage": 95.77, "elapsed_time": "4:30:23", "remaining_time": "0:11:56", "throughput": 4084.56, "total_tokens": 66263928} +{"current_steps": 114315, "total_steps": 119360, "loss": 0.3094, "lr": 5.434296622582713e-08, "epoch": 19.1546581769437, "percentage": 95.77, "elapsed_time": "4:30:23", "remaining_time": "0:11:55", "throughput": 4084.56, "total_tokens": 66266712} +{"current_steps": 114320, "total_steps": 119360, "loss": 0.3431, "lr": 5.423551946949102e-08, "epoch": 19.155495978552278, "percentage": 95.78, "elapsed_time": "4:30:24", "remaining_time": "0:11:55", "throughput": 4084.57, "total_tokens": 66269336} +{"current_steps": 114325, "total_steps": 119360, "loss": 0.4333, "lr": 5.412817846076168e-08, "epoch": 19.156333780160857, "percentage": 95.78, "elapsed_time": "4:30:25", "remaining_time": "0:11:54", "throughput": 4084.58, "total_tokens": 66272312} +{"current_steps": 114330, "total_steps": 119360, "loss": 0.3216, "lr": 5.4020943201933405e-08, "epoch": 19.157171581769436, "percentage": 95.79, "elapsed_time": "4:30:25", "remaining_time": "0:11:53", "throughput": 4084.59, "total_tokens": 66275192} +{"current_steps": 114335, "total_steps": 119360, "loss": 0.3112, "lr": 5.3913813695299355e-08, "epoch": 19.158009383378015, "percentage": 95.79, "elapsed_time": "4:30:26", "remaining_time": "0:11:53", "throughput": 4084.6, "total_tokens": 66278168} +{"current_steps": 114340, "total_steps": 119360, "loss": 0.2206, "lr": 5.380678994314992e-08, "epoch": 19.158847184986595, "percentage": 95.79, "elapsed_time": "4:30:27", "remaining_time": "0:11:52", "throughput": 4084.61, "total_tokens": 66281144} +{"current_steps": 114345, "total_steps": 119360, "loss": 0.3012, "lr": 5.369987194777382e-08, "epoch": 19.159684986595174, "percentage": 95.8, "elapsed_time": "4:30:27", "remaining_time": "0:11:51", "throughput": 4084.62, "total_tokens": 66284120} +{"current_steps": 114350, "total_steps": 119360, "loss": 0.2375, "lr": 5.359305971145701e-08, "epoch": 19.160522788203753, "percentage": 95.8, "elapsed_time": "4:30:28", "remaining_time": "0:11:51", "throughput": 4084.62, "total_tokens": 66287000} +{"current_steps": 114355, "total_steps": 119360, "loss": 0.3523, "lr": 5.348635323648321e-08, "epoch": 19.161360589812332, "percentage": 95.81, "elapsed_time": "4:30:29", "remaining_time": "0:11:50", "throughput": 4084.62, "total_tokens": 66289560} +{"current_steps": 114360, "total_steps": 119360, "loss": 0.242, "lr": 5.3379752525133944e-08, "epoch": 19.16219839142091, "percentage": 95.81, "elapsed_time": "4:30:29", "remaining_time": "0:11:49", "throughput": 4084.64, "total_tokens": 66292824} +{"current_steps": 114365, "total_steps": 119360, "loss": 0.2718, "lr": 5.327325757968793e-08, "epoch": 19.16303619302949, "percentage": 95.82, "elapsed_time": "4:30:30", "remaining_time": "0:11:48", "throughput": 4084.66, "total_tokens": 66296056} +{"current_steps": 114370, "total_steps": 119360, "loss": 0.3182, "lr": 5.3166868402423355e-08, "epoch": 19.16387399463807, "percentage": 95.82, "elapsed_time": "4:30:31", "remaining_time": "0:11:48", "throughput": 4084.67, "total_tokens": 66299096} +{"current_steps": 114375, "total_steps": 119360, "loss": 0.2407, "lr": 5.306058499561395e-08, "epoch": 19.16471179624665, "percentage": 95.82, "elapsed_time": "4:30:31", "remaining_time": "0:11:47", "throughput": 4084.68, "total_tokens": 66301912} +{"current_steps": 114380, "total_steps": 119360, "loss": 0.3841, "lr": 5.29544073615329e-08, "epoch": 19.16554959785523, "percentage": 95.83, "elapsed_time": "4:30:32", "remaining_time": "0:11:46", "throughput": 4084.69, "total_tokens": 66305016} +{"current_steps": 114385, "total_steps": 119360, "loss": 0.2856, "lr": 5.284833550245005e-08, "epoch": 19.166387399463808, "percentage": 95.83, "elapsed_time": "4:30:33", "remaining_time": "0:11:46", "throughput": 4084.7, "total_tokens": 66307960} +{"current_steps": 114390, "total_steps": 119360, "loss": 0.3389, "lr": 5.27423694206336e-08, "epoch": 19.167225201072387, "percentage": 95.84, "elapsed_time": "4:30:33", "remaining_time": "0:11:45", "throughput": 4084.71, "total_tokens": 66310808} +{"current_steps": 114395, "total_steps": 119360, "loss": 0.4892, "lr": 5.263650911834894e-08, "epoch": 19.168063002680967, "percentage": 95.84, "elapsed_time": "4:30:34", "remaining_time": "0:11:44", "throughput": 4084.71, "total_tokens": 66313592} +{"current_steps": 114400, "total_steps": 119360, "loss": 0.1114, "lr": 5.253075459785983e-08, "epoch": 19.168900804289546, "percentage": 95.84, "elapsed_time": "4:30:35", "remaining_time": "0:11:43", "throughput": 4084.72, "total_tokens": 66316344} +{"current_steps": 114405, "total_steps": 119360, "loss": 0.3761, "lr": 5.2425105861427794e-08, "epoch": 19.16973860589812, "percentage": 95.85, "elapsed_time": "4:30:35", "remaining_time": "0:11:43", "throughput": 4084.72, "total_tokens": 66318968} +{"current_steps": 114410, "total_steps": 119360, "loss": 0.5327, "lr": 5.231956291131046e-08, "epoch": 19.1705764075067, "percentage": 95.85, "elapsed_time": "4:30:36", "remaining_time": "0:11:42", "throughput": 4084.73, "total_tokens": 66321784} +{"current_steps": 114415, "total_steps": 119360, "loss": 0.461, "lr": 5.2214125749766033e-08, "epoch": 19.17141420911528, "percentage": 95.86, "elapsed_time": "4:30:37", "remaining_time": "0:11:41", "throughput": 4084.74, "total_tokens": 66324792} +{"current_steps": 114420, "total_steps": 119360, "loss": 0.2251, "lr": 5.21087943790477e-08, "epoch": 19.17225201072386, "percentage": 95.86, "elapsed_time": "4:30:37", "remaining_time": "0:11:41", "throughput": 4084.76, "total_tokens": 66327928} +{"current_steps": 114425, "total_steps": 119360, "loss": 0.3735, "lr": 5.2003568801408664e-08, "epoch": 19.17308981233244, "percentage": 95.87, "elapsed_time": "4:30:38", "remaining_time": "0:11:40", "throughput": 4084.76, "total_tokens": 66331128} +{"current_steps": 114430, "total_steps": 119360, "loss": 0.3337, "lr": 5.189844901909769e-08, "epoch": 19.173927613941018, "percentage": 95.87, "elapsed_time": "4:30:39", "remaining_time": "0:11:39", "throughput": 4084.77, "total_tokens": 66333624} +{"current_steps": 114435, "total_steps": 119360, "loss": 0.1582, "lr": 5.179343503436296e-08, "epoch": 19.174765415549597, "percentage": 95.87, "elapsed_time": "4:30:39", "remaining_time": "0:11:38", "throughput": 4084.77, "total_tokens": 66336376} +{"current_steps": 114440, "total_steps": 119360, "loss": 0.4089, "lr": 5.168852684944992e-08, "epoch": 19.175603217158177, "percentage": 95.88, "elapsed_time": "4:30:40", "remaining_time": "0:11:38", "throughput": 4084.78, "total_tokens": 66339288} +{"current_steps": 114445, "total_steps": 119360, "loss": 0.1669, "lr": 5.1583724466601756e-08, "epoch": 19.176441018766756, "percentage": 95.88, "elapsed_time": "4:30:41", "remaining_time": "0:11:37", "throughput": 4084.79, "total_tokens": 66342520} +{"current_steps": 114450, "total_steps": 119360, "loss": 0.4349, "lr": 5.147902788805892e-08, "epoch": 19.177278820375335, "percentage": 95.89, "elapsed_time": "4:30:42", "remaining_time": "0:11:36", "throughput": 4084.8, "total_tokens": 66345336} +{"current_steps": 114455, "total_steps": 119360, "loss": 0.4376, "lr": 5.137443711606016e-08, "epoch": 19.178116621983914, "percentage": 95.89, "elapsed_time": "4:30:42", "remaining_time": "0:11:36", "throughput": 4084.8, "total_tokens": 66348120} +{"current_steps": 114460, "total_steps": 119360, "loss": 0.376, "lr": 5.1269952152842026e-08, "epoch": 19.178954423592494, "percentage": 95.89, "elapsed_time": "4:30:43", "remaining_time": "0:11:35", "throughput": 4084.81, "total_tokens": 66350936} +{"current_steps": 114465, "total_steps": 119360, "loss": 0.3941, "lr": 5.116557300063774e-08, "epoch": 19.179792225201073, "percentage": 95.9, "elapsed_time": "4:30:43", "remaining_time": "0:11:34", "throughput": 4084.82, "total_tokens": 66353656} +{"current_steps": 114470, "total_steps": 119360, "loss": 0.4244, "lr": 5.106129966167994e-08, "epoch": 19.180630026809652, "percentage": 95.9, "elapsed_time": "4:30:44", "remaining_time": "0:11:33", "throughput": 4084.82, "total_tokens": 66356408} +{"current_steps": 114475, "total_steps": 119360, "loss": 0.1065, "lr": 5.095713213819797e-08, "epoch": 19.18146782841823, "percentage": 95.91, "elapsed_time": "4:30:45", "remaining_time": "0:11:33", "throughput": 4084.84, "total_tokens": 66359544} +{"current_steps": 114480, "total_steps": 119360, "loss": 0.373, "lr": 5.085307043241838e-08, "epoch": 19.18230563002681, "percentage": 95.91, "elapsed_time": "4:30:45", "remaining_time": "0:11:32", "throughput": 4084.85, "total_tokens": 66362232} +{"current_steps": 114485, "total_steps": 119360, "loss": 0.3964, "lr": 5.074911454656717e-08, "epoch": 19.18314343163539, "percentage": 95.92, "elapsed_time": "4:30:46", "remaining_time": "0:11:31", "throughput": 4084.86, "total_tokens": 66365240} +{"current_steps": 114490, "total_steps": 119360, "loss": 0.1897, "lr": 5.0645264482866444e-08, "epoch": 19.18398123324397, "percentage": 95.92, "elapsed_time": "4:30:47", "remaining_time": "0:11:31", "throughput": 4084.87, "total_tokens": 66368120} +{"current_steps": 114495, "total_steps": 119360, "loss": 0.4845, "lr": 5.05415202435372e-08, "epoch": 19.18481903485255, "percentage": 95.92, "elapsed_time": "4:30:47", "remaining_time": "0:11:30", "throughput": 4084.88, "total_tokens": 66370904} +{"current_steps": 114500, "total_steps": 119360, "loss": 0.4516, "lr": 5.043788183079712e-08, "epoch": 19.185656836461128, "percentage": 95.93, "elapsed_time": "4:30:48", "remaining_time": "0:11:29", "throughput": 4084.89, "total_tokens": 66373720} +{"current_steps": 114505, "total_steps": 119360, "loss": 0.2177, "lr": 5.03343492468622e-08, "epoch": 19.186494638069703, "percentage": 95.93, "elapsed_time": "4:30:49", "remaining_time": "0:11:28", "throughput": 4084.9, "total_tokens": 66376792} +{"current_steps": 114510, "total_steps": 119360, "loss": 0.3281, "lr": 5.0230922493946234e-08, "epoch": 19.187332439678283, "percentage": 95.94, "elapsed_time": "4:30:49", "remaining_time": "0:11:28", "throughput": 4084.91, "total_tokens": 66379672} +{"current_steps": 114515, "total_steps": 119360, "loss": 0.3623, "lr": 5.012760157426022e-08, "epoch": 19.188170241286862, "percentage": 95.94, "elapsed_time": "4:30:50", "remaining_time": "0:11:27", "throughput": 4084.93, "total_tokens": 66382616} +{"current_steps": 114520, "total_steps": 119360, "loss": 0.402, "lr": 5.002438649001462e-08, "epoch": 19.18900804289544, "percentage": 95.95, "elapsed_time": "4:30:51", "remaining_time": "0:11:26", "throughput": 4084.93, "total_tokens": 66385400} +{"current_steps": 114525, "total_steps": 119360, "loss": 0.5171, "lr": 4.992127724341489e-08, "epoch": 19.18984584450402, "percentage": 95.95, "elapsed_time": "4:30:51", "remaining_time": "0:11:26", "throughput": 4084.94, "total_tokens": 66388312} +{"current_steps": 114530, "total_steps": 119360, "loss": 0.4827, "lr": 4.981827383666593e-08, "epoch": 19.1906836461126, "percentage": 95.95, "elapsed_time": "4:30:52", "remaining_time": "0:11:25", "throughput": 4084.95, "total_tokens": 66391064} +{"current_steps": 114535, "total_steps": 119360, "loss": 0.4469, "lr": 4.971537627197098e-08, "epoch": 19.19152144772118, "percentage": 95.96, "elapsed_time": "4:30:53", "remaining_time": "0:11:24", "throughput": 4084.95, "total_tokens": 66393688} +{"current_steps": 114540, "total_steps": 119360, "loss": 0.3983, "lr": 4.961258455152884e-08, "epoch": 19.19235924932976, "percentage": 95.96, "elapsed_time": "4:30:53", "remaining_time": "0:11:23", "throughput": 4084.96, "total_tokens": 66396568} +{"current_steps": 114545, "total_steps": 119360, "loss": 0.5379, "lr": 4.9509898677538305e-08, "epoch": 19.193197050938338, "percentage": 95.97, "elapsed_time": "4:30:54", "remaining_time": "0:11:23", "throughput": 4084.97, "total_tokens": 66399416} +{"current_steps": 114550, "total_steps": 119360, "loss": 0.2046, "lr": 4.940731865219484e-08, "epoch": 19.194034852546917, "percentage": 95.97, "elapsed_time": "4:30:55", "remaining_time": "0:11:22", "throughput": 4084.97, "total_tokens": 66402232} +{"current_steps": 114555, "total_steps": 119360, "loss": 0.2689, "lr": 4.930484447769168e-08, "epoch": 19.194872654155496, "percentage": 95.97, "elapsed_time": "4:30:55", "remaining_time": "0:11:21", "throughput": 4084.98, "total_tokens": 66405208} +{"current_steps": 114560, "total_steps": 119360, "loss": 0.298, "lr": 4.920247615621931e-08, "epoch": 19.195710455764075, "percentage": 95.98, "elapsed_time": "4:30:56", "remaining_time": "0:11:21", "throughput": 4084.99, "total_tokens": 66407800} +{"current_steps": 114565, "total_steps": 119360, "loss": 0.5921, "lr": 4.910021368996765e-08, "epoch": 19.196548257372655, "percentage": 95.98, "elapsed_time": "4:30:57", "remaining_time": "0:11:20", "throughput": 4085.0, "total_tokens": 66411000} +{"current_steps": 114570, "total_steps": 119360, "loss": 0.2244, "lr": 4.89980570811216e-08, "epoch": 19.197386058981234, "percentage": 95.99, "elapsed_time": "4:30:57", "remaining_time": "0:11:19", "throughput": 4085.01, "total_tokens": 66413688} +{"current_steps": 114575, "total_steps": 119360, "loss": 0.6563, "lr": 4.889600633186664e-08, "epoch": 19.198223860589813, "percentage": 95.99, "elapsed_time": "4:30:58", "remaining_time": "0:11:19", "throughput": 4085.01, "total_tokens": 66416632} +{"current_steps": 114580, "total_steps": 119360, "loss": 0.2553, "lr": 4.879406144438492e-08, "epoch": 19.199061662198392, "percentage": 96.0, "elapsed_time": "4:30:59", "remaining_time": "0:11:18", "throughput": 4085.01, "total_tokens": 66419256} +{"current_steps": 114585, "total_steps": 119360, "loss": 0.3673, "lr": 4.869222242085525e-08, "epoch": 19.19989946380697, "percentage": 96.0, "elapsed_time": "4:30:59", "remaining_time": "0:11:17", "throughput": 4085.02, "total_tokens": 66422008} +{"current_steps": 114590, "total_steps": 119360, "loss": 0.4281, "lr": 4.859048926345589e-08, "epoch": 19.20073726541555, "percentage": 96.0, "elapsed_time": "4:31:00", "remaining_time": "0:11:16", "throughput": 4085.03, "total_tokens": 66424824} +{"current_steps": 114595, "total_steps": 119360, "loss": 0.3876, "lr": 4.8488861974361756e-08, "epoch": 19.20157506702413, "percentage": 96.01, "elapsed_time": "4:31:01", "remaining_time": "0:11:16", "throughput": 4085.03, "total_tokens": 66427448} +{"current_steps": 114600, "total_steps": 119360, "loss": 0.2936, "lr": 4.838734055574557e-08, "epoch": 19.202412868632706, "percentage": 96.01, "elapsed_time": "4:31:01", "remaining_time": "0:11:15", "throughput": 4085.04, "total_tokens": 66430296} +{"current_steps": 114605, "total_steps": 119360, "loss": 0.3113, "lr": 4.828592500977836e-08, "epoch": 19.203250670241285, "percentage": 96.02, "elapsed_time": "4:31:02", "remaining_time": "0:11:14", "throughput": 4085.05, "total_tokens": 66433304} +{"current_steps": 114610, "total_steps": 119360, "loss": 0.5518, "lr": 4.818461533862839e-08, "epoch": 19.204088471849865, "percentage": 96.02, "elapsed_time": "4:31:03", "remaining_time": "0:11:14", "throughput": 4085.06, "total_tokens": 66436024} +{"current_steps": 114615, "total_steps": 119360, "loss": 0.2959, "lr": 4.808341154446117e-08, "epoch": 19.204926273458444, "percentage": 96.02, "elapsed_time": "4:31:03", "remaining_time": "0:11:13", "throughput": 4085.06, "total_tokens": 66438744} +{"current_steps": 114620, "total_steps": 119360, "loss": 0.3839, "lr": 4.7982313629441614e-08, "epoch": 19.205764075067023, "percentage": 96.03, "elapsed_time": "4:31:04", "remaining_time": "0:11:12", "throughput": 4085.07, "total_tokens": 66441816} +{"current_steps": 114625, "total_steps": 119360, "loss": 0.1636, "lr": 4.788132159573133e-08, "epoch": 19.206601876675602, "percentage": 96.03, "elapsed_time": "4:31:05", "remaining_time": "0:11:11", "throughput": 4085.08, "total_tokens": 66444728} +{"current_steps": 114630, "total_steps": 119360, "loss": 0.1967, "lr": 4.778043544548916e-08, "epoch": 19.20743967828418, "percentage": 96.04, "elapsed_time": "4:31:05", "remaining_time": "0:11:11", "throughput": 4085.09, "total_tokens": 66447544} +{"current_steps": 114635, "total_steps": 119360, "loss": 0.2697, "lr": 4.7679655180871697e-08, "epoch": 19.20827747989276, "percentage": 96.04, "elapsed_time": "4:31:06", "remaining_time": "0:11:10", "throughput": 4085.1, "total_tokens": 66450360} +{"current_steps": 114640, "total_steps": 119360, "loss": 0.3777, "lr": 4.7578980804035e-08, "epoch": 19.20911528150134, "percentage": 96.05, "elapsed_time": "4:31:07", "remaining_time": "0:11:09", "throughput": 4085.11, "total_tokens": 66453496} +{"current_steps": 114645, "total_steps": 119360, "loss": 0.2615, "lr": 4.7478412317130686e-08, "epoch": 19.20995308310992, "percentage": 96.05, "elapsed_time": "4:31:07", "remaining_time": "0:11:09", "throughput": 4085.11, "total_tokens": 66456216} +{"current_steps": 114650, "total_steps": 119360, "loss": 0.1571, "lr": 4.737794972230925e-08, "epoch": 19.2107908847185, "percentage": 96.05, "elapsed_time": "4:31:08", "remaining_time": "0:11:08", "throughput": 4085.13, "total_tokens": 66459256} +{"current_steps": 114655, "total_steps": 119360, "loss": 0.1753, "lr": 4.727759302171953e-08, "epoch": 19.211628686327078, "percentage": 96.06, "elapsed_time": "4:31:09", "remaining_time": "0:11:07", "throughput": 4085.13, "total_tokens": 66462136} +{"current_steps": 114660, "total_steps": 119360, "loss": 0.4686, "lr": 4.7177342217505914e-08, "epoch": 19.212466487935657, "percentage": 96.06, "elapsed_time": "4:31:09", "remaining_time": "0:11:06", "throughput": 4085.14, "total_tokens": 66465176} +{"current_steps": 114665, "total_steps": 119360, "loss": 0.5293, "lr": 4.707719731181282e-08, "epoch": 19.213304289544237, "percentage": 96.07, "elapsed_time": "4:31:10", "remaining_time": "0:11:06", "throughput": 4085.15, "total_tokens": 66467960} +{"current_steps": 114670, "total_steps": 119360, "loss": 0.3078, "lr": 4.697715830678184e-08, "epoch": 19.214142091152816, "percentage": 96.07, "elapsed_time": "4:31:11", "remaining_time": "0:11:05", "throughput": 4085.16, "total_tokens": 66470872} +{"current_steps": 114675, "total_steps": 119360, "loss": 0.2211, "lr": 4.687722520455073e-08, "epoch": 19.214979892761395, "percentage": 96.07, "elapsed_time": "4:31:11", "remaining_time": "0:11:04", "throughput": 4085.17, "total_tokens": 66473816} +{"current_steps": 114680, "total_steps": 119360, "loss": 0.2651, "lr": 4.677739800725667e-08, "epoch": 19.215817694369974, "percentage": 96.08, "elapsed_time": "4:31:12", "remaining_time": "0:11:04", "throughput": 4085.18, "total_tokens": 66476664} +{"current_steps": 114685, "total_steps": 119360, "loss": 0.3435, "lr": 4.667767671703516e-08, "epoch": 19.216655495978554, "percentage": 96.08, "elapsed_time": "4:31:13", "remaining_time": "0:11:03", "throughput": 4085.19, "total_tokens": 66479736} +{"current_steps": 114690, "total_steps": 119360, "loss": 0.1735, "lr": 4.657806133601728e-08, "epoch": 19.217493297587133, "percentage": 96.09, "elapsed_time": "4:31:14", "remaining_time": "0:11:02", "throughput": 4085.19, "total_tokens": 66482424} +{"current_steps": 114695, "total_steps": 119360, "loss": 0.1194, "lr": 4.647855186633299e-08, "epoch": 19.218331099195712, "percentage": 96.09, "elapsed_time": "4:31:14", "remaining_time": "0:11:01", "throughput": 4085.19, "total_tokens": 66485336} +{"current_steps": 114700, "total_steps": 119360, "loss": 0.2914, "lr": 4.6379148310110034e-08, "epoch": 19.219168900804288, "percentage": 96.1, "elapsed_time": "4:31:15", "remaining_time": "0:11:01", "throughput": 4085.2, "total_tokens": 66488184} +{"current_steps": 114705, "total_steps": 119360, "loss": 0.3143, "lr": 4.627985066947394e-08, "epoch": 19.220006702412867, "percentage": 96.1, "elapsed_time": "4:31:16", "remaining_time": "0:11:00", "throughput": 4085.21, "total_tokens": 66491000} +{"current_steps": 114710, "total_steps": 119360, "loss": 0.1514, "lr": 4.6180658946547995e-08, "epoch": 19.220844504021446, "percentage": 96.1, "elapsed_time": "4:31:16", "remaining_time": "0:10:59", "throughput": 4085.21, "total_tokens": 66493912} +{"current_steps": 114715, "total_steps": 119360, "loss": 0.2173, "lr": 4.6081573143453296e-08, "epoch": 19.221682305630026, "percentage": 96.11, "elapsed_time": "4:31:17", "remaining_time": "0:10:59", "throughput": 4085.22, "total_tokens": 66496824} +{"current_steps": 114720, "total_steps": 119360, "loss": 0.3494, "lr": 4.598259326230758e-08, "epoch": 19.222520107238605, "percentage": 96.11, "elapsed_time": "4:31:18", "remaining_time": "0:10:58", "throughput": 4085.24, "total_tokens": 66499960} +{"current_steps": 114725, "total_steps": 119360, "loss": 0.4875, "lr": 4.5883719305227504e-08, "epoch": 19.223357908847184, "percentage": 96.12, "elapsed_time": "4:31:18", "remaining_time": "0:10:57", "throughput": 4085.24, "total_tokens": 66502520} +{"current_steps": 114730, "total_steps": 119360, "loss": 0.281, "lr": 4.578495127432803e-08, "epoch": 19.224195710455763, "percentage": 96.12, "elapsed_time": "4:31:19", "remaining_time": "0:10:56", "throughput": 4085.26, "total_tokens": 66505688} +{"current_steps": 114735, "total_steps": 119360, "loss": 0.27, "lr": 4.568628917171969e-08, "epoch": 19.225033512064343, "percentage": 96.13, "elapsed_time": "4:31:20", "remaining_time": "0:10:56", "throughput": 4085.27, "total_tokens": 66508824} +{"current_steps": 114740, "total_steps": 119360, "loss": 0.5223, "lr": 4.558773299951247e-08, "epoch": 19.225871313672922, "percentage": 96.13, "elapsed_time": "4:31:20", "remaining_time": "0:10:55", "throughput": 4085.27, "total_tokens": 66511480} +{"current_steps": 114745, "total_steps": 119360, "loss": 0.068, "lr": 4.5489282759814125e-08, "epoch": 19.2267091152815, "percentage": 96.13, "elapsed_time": "4:31:21", "remaining_time": "0:10:54", "throughput": 4085.28, "total_tokens": 66514488} +{"current_steps": 114750, "total_steps": 119360, "loss": 0.1389, "lr": 4.539093845472908e-08, "epoch": 19.22754691689008, "percentage": 96.14, "elapsed_time": "4:31:22", "remaining_time": "0:10:54", "throughput": 4085.29, "total_tokens": 66517240} +{"current_steps": 114755, "total_steps": 119360, "loss": 0.3899, "lr": 4.529270008636011e-08, "epoch": 19.22838471849866, "percentage": 96.14, "elapsed_time": "4:31:22", "remaining_time": "0:10:53", "throughput": 4085.3, "total_tokens": 66519960} +{"current_steps": 114760, "total_steps": 119360, "loss": 0.4562, "lr": 4.5194567656807743e-08, "epoch": 19.22922252010724, "percentage": 96.15, "elapsed_time": "4:31:23", "remaining_time": "0:10:52", "throughput": 4085.3, "total_tokens": 66522520} +{"current_steps": 114765, "total_steps": 119360, "loss": 0.137, "lr": 4.5096541168170305e-08, "epoch": 19.23006032171582, "percentage": 96.15, "elapsed_time": "4:31:24", "remaining_time": "0:10:51", "throughput": 4085.31, "total_tokens": 66525496} +{"current_steps": 114770, "total_steps": 119360, "loss": 0.2101, "lr": 4.49986206225439e-08, "epoch": 19.230898123324398, "percentage": 96.15, "elapsed_time": "4:31:24", "remaining_time": "0:10:51", "throughput": 4085.31, "total_tokens": 66528280} +{"current_steps": 114775, "total_steps": 119360, "loss": 0.4955, "lr": 4.4900806022022404e-08, "epoch": 19.231735924932977, "percentage": 96.16, "elapsed_time": "4:31:25", "remaining_time": "0:10:50", "throughput": 4085.32, "total_tokens": 66531064} +{"current_steps": 114780, "total_steps": 119360, "loss": 0.1868, "lr": 4.480309736869637e-08, "epoch": 19.232573726541556, "percentage": 96.16, "elapsed_time": "4:31:26", "remaining_time": "0:10:49", "throughput": 4085.33, "total_tokens": 66533880} +{"current_steps": 114785, "total_steps": 119360, "loss": 0.2978, "lr": 4.4705494664655234e-08, "epoch": 19.233411528150135, "percentage": 96.17, "elapsed_time": "4:31:26", "remaining_time": "0:10:49", "throughput": 4085.34, "total_tokens": 66536632} +{"current_steps": 114790, "total_steps": 119360, "loss": 0.1842, "lr": 4.4607997911986776e-08, "epoch": 19.234249329758715, "percentage": 96.17, "elapsed_time": "4:31:27", "remaining_time": "0:10:48", "throughput": 4085.34, "total_tokens": 66539384} +{"current_steps": 114795, "total_steps": 119360, "loss": 0.3732, "lr": 4.4510607112774884e-08, "epoch": 19.235087131367294, "percentage": 96.18, "elapsed_time": "4:31:28", "remaining_time": "0:10:47", "throughput": 4085.35, "total_tokens": 66542328} +{"current_steps": 114800, "total_steps": 119360, "loss": 0.2451, "lr": 4.441332226910122e-08, "epoch": 19.23592493297587, "percentage": 96.18, "elapsed_time": "4:31:28", "remaining_time": "0:10:47", "throughput": 4085.36, "total_tokens": 66545176} +{"current_steps": 114805, "total_steps": 119360, "loss": 0.311, "lr": 4.4316143383047463e-08, "epoch": 19.23676273458445, "percentage": 96.18, "elapsed_time": "4:31:29", "remaining_time": "0:10:46", "throughput": 4085.37, "total_tokens": 66548056} +{"current_steps": 114810, "total_steps": 119360, "loss": 0.3953, "lr": 4.421907045669027e-08, "epoch": 19.23760053619303, "percentage": 96.19, "elapsed_time": "4:31:29", "remaining_time": "0:10:45", "throughput": 4085.38, "total_tokens": 66550744} +{"current_steps": 114815, "total_steps": 119360, "loss": 0.3258, "lr": 4.412210349210522e-08, "epoch": 19.238438337801608, "percentage": 96.19, "elapsed_time": "4:31:30", "remaining_time": "0:10:44", "throughput": 4085.38, "total_tokens": 66553592} +{"current_steps": 114820, "total_steps": 119360, "loss": 0.4332, "lr": 4.402524249136619e-08, "epoch": 19.239276139410187, "percentage": 96.2, "elapsed_time": "4:31:31", "remaining_time": "0:10:44", "throughput": 4085.39, "total_tokens": 66556472} +{"current_steps": 114825, "total_steps": 119360, "loss": 0.2562, "lr": 4.3928487456543765e-08, "epoch": 19.240113941018766, "percentage": 96.2, "elapsed_time": "4:31:31", "remaining_time": "0:10:43", "throughput": 4085.41, "total_tokens": 66559416} +{"current_steps": 114830, "total_steps": 119360, "loss": 0.7035, "lr": 4.383183838970739e-08, "epoch": 19.240951742627345, "percentage": 96.2, "elapsed_time": "4:31:32", "remaining_time": "0:10:42", "throughput": 4085.42, "total_tokens": 66562712} +{"current_steps": 114835, "total_steps": 119360, "loss": 0.3384, "lr": 4.3735295292923196e-08, "epoch": 19.241789544235925, "percentage": 96.21, "elapsed_time": "4:31:33", "remaining_time": "0:10:42", "throughput": 4085.43, "total_tokens": 66565592} +{"current_steps": 114840, "total_steps": 119360, "loss": 0.088, "lr": 4.3638858168254524e-08, "epoch": 19.242627345844504, "percentage": 96.21, "elapsed_time": "4:31:34", "remaining_time": "0:10:41", "throughput": 4085.45, "total_tokens": 66568664} +{"current_steps": 114845, "total_steps": 119360, "loss": 0.3018, "lr": 4.354252701776418e-08, "epoch": 19.243465147453083, "percentage": 96.22, "elapsed_time": "4:31:34", "remaining_time": "0:10:40", "throughput": 4085.45, "total_tokens": 66571544} +{"current_steps": 114850, "total_steps": 119360, "loss": 0.4534, "lr": 4.344630184351217e-08, "epoch": 19.244302949061662, "percentage": 96.22, "elapsed_time": "4:31:35", "remaining_time": "0:10:39", "throughput": 4085.47, "total_tokens": 66574424} +{"current_steps": 114855, "total_steps": 119360, "loss": 0.2795, "lr": 4.335018264755519e-08, "epoch": 19.24514075067024, "percentage": 96.23, "elapsed_time": "4:31:36", "remaining_time": "0:10:39", "throughput": 4085.47, "total_tokens": 66577016} +{"current_steps": 114860, "total_steps": 119360, "loss": 0.2189, "lr": 4.325416943194938e-08, "epoch": 19.24597855227882, "percentage": 96.23, "elapsed_time": "4:31:36", "remaining_time": "0:10:38", "throughput": 4085.47, "total_tokens": 66579864} +{"current_steps": 114865, "total_steps": 119360, "loss": 0.209, "lr": 4.3158262198746414e-08, "epoch": 19.2468163538874, "percentage": 96.23, "elapsed_time": "4:31:37", "remaining_time": "0:10:37", "throughput": 4085.49, "total_tokens": 66582904} +{"current_steps": 114870, "total_steps": 119360, "loss": 0.3211, "lr": 4.3062460949997445e-08, "epoch": 19.24765415549598, "percentage": 96.24, "elapsed_time": "4:31:38", "remaining_time": "0:10:37", "throughput": 4085.5, "total_tokens": 66585784} +{"current_steps": 114875, "total_steps": 119360, "loss": 0.3891, "lr": 4.296676568775138e-08, "epoch": 19.24849195710456, "percentage": 96.24, "elapsed_time": "4:31:38", "remaining_time": "0:10:36", "throughput": 4085.52, "total_tokens": 66588888} +{"current_steps": 114880, "total_steps": 119360, "loss": 0.1421, "lr": 4.28711764140538e-08, "epoch": 19.249329758713138, "percentage": 96.25, "elapsed_time": "4:31:39", "remaining_time": "0:10:35", "throughput": 4085.53, "total_tokens": 66591736} +{"current_steps": 114885, "total_steps": 119360, "loss": 0.5263, "lr": 4.2775693130948094e-08, "epoch": 19.250167560321717, "percentage": 96.25, "elapsed_time": "4:31:40", "remaining_time": "0:10:34", "throughput": 4085.54, "total_tokens": 66594808} +{"current_steps": 114890, "total_steps": 119360, "loss": 0.4333, "lr": 4.2680315840476496e-08, "epoch": 19.251005361930297, "percentage": 96.26, "elapsed_time": "4:31:40", "remaining_time": "0:10:34", "throughput": 4085.55, "total_tokens": 66597624} +{"current_steps": 114895, "total_steps": 119360, "loss": 0.2475, "lr": 4.258504454467849e-08, "epoch": 19.251843163538872, "percentage": 96.26, "elapsed_time": "4:31:41", "remaining_time": "0:10:33", "throughput": 4085.56, "total_tokens": 66600536} +{"current_steps": 114900, "total_steps": 119360, "loss": 0.5785, "lr": 4.248987924559078e-08, "epoch": 19.25268096514745, "percentage": 96.26, "elapsed_time": "4:31:42", "remaining_time": "0:10:32", "throughput": 4085.57, "total_tokens": 66603352} +{"current_steps": 114905, "total_steps": 119360, "loss": 0.2209, "lr": 4.2394819945247855e-08, "epoch": 19.25351876675603, "percentage": 96.27, "elapsed_time": "4:31:42", "remaining_time": "0:10:32", "throughput": 4085.59, "total_tokens": 66606520} +{"current_steps": 114910, "total_steps": 119360, "loss": 0.351, "lr": 4.229986664568253e-08, "epoch": 19.25435656836461, "percentage": 96.27, "elapsed_time": "4:31:43", "remaining_time": "0:10:31", "throughput": 4085.6, "total_tokens": 66609592} +{"current_steps": 114915, "total_steps": 119360, "loss": 0.127, "lr": 4.2205019348925405e-08, "epoch": 19.25519436997319, "percentage": 96.28, "elapsed_time": "4:31:44", "remaining_time": "0:10:30", "throughput": 4085.6, "total_tokens": 66612312} +{"current_steps": 114920, "total_steps": 119360, "loss": 0.3185, "lr": 4.2110278057003736e-08, "epoch": 19.25603217158177, "percentage": 96.28, "elapsed_time": "4:31:44", "remaining_time": "0:10:29", "throughput": 4085.61, "total_tokens": 66615128} +{"current_steps": 114925, "total_steps": 119360, "loss": 0.4942, "lr": 4.201564277194314e-08, "epoch": 19.256869973190348, "percentage": 96.28, "elapsed_time": "4:31:45", "remaining_time": "0:10:29", "throughput": 4085.63, "total_tokens": 66618232} +{"current_steps": 114930, "total_steps": 119360, "loss": 0.3341, "lr": 4.192111349576811e-08, "epoch": 19.257707774798927, "percentage": 96.29, "elapsed_time": "4:31:46", "remaining_time": "0:10:28", "throughput": 4085.64, "total_tokens": 66621176} +{"current_steps": 114935, "total_steps": 119360, "loss": 0.2613, "lr": 4.182669023049923e-08, "epoch": 19.258545576407506, "percentage": 96.29, "elapsed_time": "4:31:46", "remaining_time": "0:10:27", "throughput": 4085.65, "total_tokens": 66624184} +{"current_steps": 114940, "total_steps": 119360, "loss": 0.4448, "lr": 4.1732372978155466e-08, "epoch": 19.259383378016086, "percentage": 96.3, "elapsed_time": "4:31:47", "remaining_time": "0:10:27", "throughput": 4085.65, "total_tokens": 66626872} +{"current_steps": 114945, "total_steps": 119360, "loss": 0.6148, "lr": 4.1638161740752415e-08, "epoch": 19.260221179624665, "percentage": 96.3, "elapsed_time": "4:31:48", "remaining_time": "0:10:26", "throughput": 4085.66, "total_tokens": 66629816} +{"current_steps": 114950, "total_steps": 119360, "loss": 0.7699, "lr": 4.154405652030624e-08, "epoch": 19.261058981233244, "percentage": 96.31, "elapsed_time": "4:31:48", "remaining_time": "0:10:25", "throughput": 4085.67, "total_tokens": 66633016} +{"current_steps": 114955, "total_steps": 119360, "loss": 0.4533, "lr": 4.145005731882812e-08, "epoch": 19.261896782841823, "percentage": 96.31, "elapsed_time": "4:31:49", "remaining_time": "0:10:24", "throughput": 4085.69, "total_tokens": 66636056} +{"current_steps": 114960, "total_steps": 119360, "loss": 0.4658, "lr": 4.135616413832755e-08, "epoch": 19.262734584450403, "percentage": 96.31, "elapsed_time": "4:31:50", "remaining_time": "0:10:24", "throughput": 4085.7, "total_tokens": 66639000} +{"current_steps": 114965, "total_steps": 119360, "loss": 0.3523, "lr": 4.1262376980812924e-08, "epoch": 19.263572386058982, "percentage": 96.32, "elapsed_time": "4:31:50", "remaining_time": "0:10:23", "throughput": 4085.7, "total_tokens": 66641624} +{"current_steps": 114970, "total_steps": 119360, "loss": 0.4446, "lr": 4.116869584828931e-08, "epoch": 19.26441018766756, "percentage": 96.32, "elapsed_time": "4:31:51", "remaining_time": "0:10:22", "throughput": 4085.71, "total_tokens": 66644472} +{"current_steps": 114975, "total_steps": 119360, "loss": 0.3623, "lr": 4.107512074275899e-08, "epoch": 19.26524798927614, "percentage": 96.33, "elapsed_time": "4:31:52", "remaining_time": "0:10:22", "throughput": 4085.72, "total_tokens": 66647416} +{"current_steps": 114980, "total_steps": 119360, "loss": 0.3025, "lr": 4.09816516662237e-08, "epoch": 19.26608579088472, "percentage": 96.33, "elapsed_time": "4:31:52", "remaining_time": "0:10:21", "throughput": 4085.73, "total_tokens": 66650360} +{"current_steps": 114985, "total_steps": 119360, "loss": 0.4873, "lr": 4.088828862068128e-08, "epoch": 19.2669235924933, "percentage": 96.33, "elapsed_time": "4:31:53", "remaining_time": "0:10:20", "throughput": 4085.73, "total_tokens": 66652952} +{"current_steps": 114990, "total_steps": 119360, "loss": 0.2835, "lr": 4.079503160812848e-08, "epoch": 19.26776139410188, "percentage": 96.34, "elapsed_time": "4:31:54", "remaining_time": "0:10:19", "throughput": 4085.74, "total_tokens": 66655768} +{"current_steps": 114995, "total_steps": 119360, "loss": 0.1838, "lr": 4.070188063055924e-08, "epoch": 19.268599195710454, "percentage": 96.34, "elapsed_time": "4:31:54", "remaining_time": "0:10:19", "throughput": 4085.75, "total_tokens": 66658776} +{"current_steps": 115000, "total_steps": 119360, "loss": 0.2967, "lr": 4.060883568996476e-08, "epoch": 19.269436997319033, "percentage": 96.35, "elapsed_time": "4:31:55", "remaining_time": "0:10:18", "throughput": 4085.76, "total_tokens": 66661592} +{"current_steps": 115005, "total_steps": 119360, "loss": 0.3692, "lr": 4.0515896788335116e-08, "epoch": 19.270274798927613, "percentage": 96.35, "elapsed_time": "4:31:56", "remaining_time": "0:10:17", "throughput": 4085.76, "total_tokens": 66664312} +{"current_steps": 115010, "total_steps": 119360, "loss": 0.327, "lr": 4.042306392765649e-08, "epoch": 19.271112600536192, "percentage": 96.36, "elapsed_time": "4:31:56", "remaining_time": "0:10:17", "throughput": 4085.77, "total_tokens": 66667064} +{"current_steps": 115015, "total_steps": 119360, "loss": 0.339, "lr": 4.0330337109915074e-08, "epoch": 19.27195040214477, "percentage": 96.36, "elapsed_time": "4:31:57", "remaining_time": "0:10:16", "throughput": 4085.78, "total_tokens": 66670072} +{"current_steps": 115020, "total_steps": 119360, "loss": 0.3221, "lr": 4.023771633709261e-08, "epoch": 19.27278820375335, "percentage": 96.36, "elapsed_time": "4:31:58", "remaining_time": "0:10:15", "throughput": 4085.79, "total_tokens": 66673176} +{"current_steps": 115025, "total_steps": 119360, "loss": 0.2839, "lr": 4.014520161116975e-08, "epoch": 19.27362600536193, "percentage": 96.37, "elapsed_time": "4:31:58", "remaining_time": "0:10:15", "throughput": 4085.8, "total_tokens": 66676088} +{"current_steps": 115030, "total_steps": 119360, "loss": 0.3064, "lr": 4.0052792934124896e-08, "epoch": 19.27446380697051, "percentage": 96.37, "elapsed_time": "4:31:59", "remaining_time": "0:10:14", "throughput": 4085.82, "total_tokens": 66679128} +{"current_steps": 115035, "total_steps": 119360, "loss": 0.2024, "lr": 3.996049030793314e-08, "epoch": 19.27530160857909, "percentage": 96.38, "elapsed_time": "4:32:00", "remaining_time": "0:10:13", "throughput": 4085.82, "total_tokens": 66681944} +{"current_steps": 115040, "total_steps": 119360, "loss": 0.5114, "lr": 3.9868293734568466e-08, "epoch": 19.276139410187668, "percentage": 96.38, "elapsed_time": "4:32:01", "remaining_time": "0:10:12", "throughput": 4085.83, "total_tokens": 66684920} +{"current_steps": 115045, "total_steps": 119360, "loss": 0.2069, "lr": 3.977620321600262e-08, "epoch": 19.276977211796247, "percentage": 96.38, "elapsed_time": "4:32:01", "remaining_time": "0:10:12", "throughput": 4085.84, "total_tokens": 66687800} +{"current_steps": 115050, "total_steps": 119360, "loss": 0.2545, "lr": 3.968421875420347e-08, "epoch": 19.277815013404826, "percentage": 96.39, "elapsed_time": "4:32:02", "remaining_time": "0:10:11", "throughput": 4085.85, "total_tokens": 66690712} +{"current_steps": 115055, "total_steps": 119360, "loss": 0.6101, "lr": 3.95923403511389e-08, "epoch": 19.278652815013405, "percentage": 96.39, "elapsed_time": "4:32:03", "remaining_time": "0:10:10", "throughput": 4085.86, "total_tokens": 66693656} +{"current_steps": 115060, "total_steps": 119360, "loss": 0.3878, "lr": 3.950056800877289e-08, "epoch": 19.279490616621985, "percentage": 96.4, "elapsed_time": "4:32:03", "remaining_time": "0:10:10", "throughput": 4085.87, "total_tokens": 66696632} +{"current_steps": 115065, "total_steps": 119360, "loss": 0.263, "lr": 3.940890172906775e-08, "epoch": 19.280328418230564, "percentage": 96.4, "elapsed_time": "4:32:04", "remaining_time": "0:10:09", "throughput": 4085.88, "total_tokens": 66699544} +{"current_steps": 115070, "total_steps": 119360, "loss": 0.3465, "lr": 3.9317341513983034e-08, "epoch": 19.281166219839143, "percentage": 96.41, "elapsed_time": "4:32:05", "remaining_time": "0:10:08", "throughput": 4085.89, "total_tokens": 66702488} +{"current_steps": 115075, "total_steps": 119360, "loss": 0.5005, "lr": 3.922588736547772e-08, "epoch": 19.282004021447722, "percentage": 96.41, "elapsed_time": "4:32:05", "remaining_time": "0:10:07", "throughput": 4085.9, "total_tokens": 66705592} +{"current_steps": 115080, "total_steps": 119360, "loss": 0.27, "lr": 3.913453928550581e-08, "epoch": 19.2828418230563, "percentage": 96.41, "elapsed_time": "4:32:06", "remaining_time": "0:10:07", "throughput": 4085.91, "total_tokens": 66708760} +{"current_steps": 115085, "total_steps": 119360, "loss": 0.4204, "lr": 3.904329727602074e-08, "epoch": 19.28367962466488, "percentage": 96.42, "elapsed_time": "4:32:07", "remaining_time": "0:10:06", "throughput": 4085.92, "total_tokens": 66711800} +{"current_steps": 115090, "total_steps": 119360, "loss": 0.3946, "lr": 3.895216133897428e-08, "epoch": 19.28451742627346, "percentage": 96.42, "elapsed_time": "4:32:07", "remaining_time": "0:10:05", "throughput": 4085.92, "total_tokens": 66714520} +{"current_steps": 115095, "total_steps": 119360, "loss": 0.3448, "lr": 3.886113147631376e-08, "epoch": 19.285355227882036, "percentage": 96.43, "elapsed_time": "4:32:08", "remaining_time": "0:10:05", "throughput": 4085.93, "total_tokens": 66717368} +{"current_steps": 115100, "total_steps": 119360, "loss": 0.289, "lr": 3.877020768998652e-08, "epoch": 19.286193029490615, "percentage": 96.43, "elapsed_time": "4:32:09", "remaining_time": "0:10:04", "throughput": 4085.94, "total_tokens": 66720440} +{"current_steps": 115105, "total_steps": 119360, "loss": 0.1803, "lr": 3.867938998193654e-08, "epoch": 19.287030831099194, "percentage": 96.44, "elapsed_time": "4:32:09", "remaining_time": "0:10:03", "throughput": 4085.95, "total_tokens": 66723320} +{"current_steps": 115110, "total_steps": 119360, "loss": 0.177, "lr": 3.858867835410507e-08, "epoch": 19.287868632707774, "percentage": 96.44, "elapsed_time": "4:32:10", "remaining_time": "0:10:02", "throughput": 4085.97, "total_tokens": 66726584} +{"current_steps": 115115, "total_steps": 119360, "loss": 0.3744, "lr": 3.849807280843221e-08, "epoch": 19.288706434316353, "percentage": 96.44, "elapsed_time": "4:32:11", "remaining_time": "0:10:02", "throughput": 4085.97, "total_tokens": 66729336} +{"current_steps": 115120, "total_steps": 119360, "loss": 0.4565, "lr": 3.8407573346855295e-08, "epoch": 19.289544235924932, "percentage": 96.45, "elapsed_time": "4:32:11", "remaining_time": "0:10:01", "throughput": 4085.98, "total_tokens": 66732152} +{"current_steps": 115125, "total_steps": 119360, "loss": 0.4125, "lr": 3.831717997130835e-08, "epoch": 19.29038203753351, "percentage": 96.45, "elapsed_time": "4:32:12", "remaining_time": "0:10:00", "throughput": 4085.99, "total_tokens": 66734936} +{"current_steps": 115130, "total_steps": 119360, "loss": 0.3461, "lr": 3.8226892683725366e-08, "epoch": 19.29121983914209, "percentage": 96.46, "elapsed_time": "4:32:13", "remaining_time": "0:10:00", "throughput": 4086.0, "total_tokens": 66737976} +{"current_steps": 115135, "total_steps": 119360, "loss": 0.3312, "lr": 3.8136711486035926e-08, "epoch": 19.29205764075067, "percentage": 96.46, "elapsed_time": "4:32:14", "remaining_time": "0:09:59", "throughput": 4086.02, "total_tokens": 66741528} +{"current_steps": 115140, "total_steps": 119360, "loss": 0.5605, "lr": 3.804663638016903e-08, "epoch": 19.29289544235925, "percentage": 96.46, "elapsed_time": "4:32:14", "remaining_time": "0:09:58", "throughput": 4086.03, "total_tokens": 66744376} +{"current_steps": 115145, "total_steps": 119360, "loss": 0.15, "lr": 3.7956667368049815e-08, "epoch": 19.29373324396783, "percentage": 96.47, "elapsed_time": "4:32:15", "remaining_time": "0:09:57", "throughput": 4086.03, "total_tokens": 66747224} +{"current_steps": 115150, "total_steps": 119360, "loss": 0.4564, "lr": 3.786680445160229e-08, "epoch": 19.294571045576408, "percentage": 96.47, "elapsed_time": "4:32:16", "remaining_time": "0:09:57", "throughput": 4086.05, "total_tokens": 66750392} +{"current_steps": 115155, "total_steps": 119360, "loss": 0.3384, "lr": 3.77770476327477e-08, "epoch": 19.295408847184987, "percentage": 96.48, "elapsed_time": "4:32:16", "remaining_time": "0:09:56", "throughput": 4086.06, "total_tokens": 66753144} +{"current_steps": 115160, "total_steps": 119360, "loss": 0.2783, "lr": 3.7687396913405614e-08, "epoch": 19.296246648793566, "percentage": 96.48, "elapsed_time": "4:32:17", "remaining_time": "0:09:55", "throughput": 4086.06, "total_tokens": 66755960} +{"current_steps": 115165, "total_steps": 119360, "loss": 0.4012, "lr": 3.759785229549284e-08, "epoch": 19.297084450402146, "percentage": 96.49, "elapsed_time": "4:32:18", "remaining_time": "0:09:55", "throughput": 4086.07, "total_tokens": 66758904} +{"current_steps": 115170, "total_steps": 119360, "loss": 0.404, "lr": 3.7508413780923406e-08, "epoch": 19.297922252010725, "percentage": 96.49, "elapsed_time": "4:32:18", "remaining_time": "0:09:54", "throughput": 4086.08, "total_tokens": 66762072} +{"current_steps": 115175, "total_steps": 119360, "loss": 0.2863, "lr": 3.741908137161021e-08, "epoch": 19.298760053619304, "percentage": 96.49, "elapsed_time": "4:32:19", "remaining_time": "0:09:53", "throughput": 4086.09, "total_tokens": 66765240} +{"current_steps": 115180, "total_steps": 119360, "loss": 0.2359, "lr": 3.7329855069463406e-08, "epoch": 19.299597855227884, "percentage": 96.5, "elapsed_time": "4:32:20", "remaining_time": "0:09:53", "throughput": 4086.1, "total_tokens": 66768152} +{"current_steps": 115185, "total_steps": 119360, "loss": 0.2032, "lr": 3.7240734876389796e-08, "epoch": 19.300435656836463, "percentage": 96.5, "elapsed_time": "4:32:21", "remaining_time": "0:09:52", "throughput": 4086.12, "total_tokens": 66771320} +{"current_steps": 115190, "total_steps": 119360, "loss": 0.2419, "lr": 3.7151720794295635e-08, "epoch": 19.30127345844504, "percentage": 96.51, "elapsed_time": "4:32:21", "remaining_time": "0:09:51", "throughput": 4086.13, "total_tokens": 66774424} +{"current_steps": 115195, "total_steps": 119360, "loss": 0.2876, "lr": 3.706281282508439e-08, "epoch": 19.302111260053618, "percentage": 96.51, "elapsed_time": "4:32:22", "remaining_time": "0:09:50", "throughput": 4086.15, "total_tokens": 66777400} +{"current_steps": 115200, "total_steps": 119360, "loss": 0.4393, "lr": 3.6974010970656784e-08, "epoch": 19.302949061662197, "percentage": 96.51, "elapsed_time": "4:32:23", "remaining_time": "0:09:50", "throughput": 4086.15, "total_tokens": 66780056} +{"current_steps": 115205, "total_steps": 119360, "loss": 0.262, "lr": 3.688531523291128e-08, "epoch": 19.303786863270776, "percentage": 96.52, "elapsed_time": "4:32:23", "remaining_time": "0:09:49", "throughput": 4086.16, "total_tokens": 66782968} +{"current_steps": 115210, "total_steps": 119360, "loss": 0.4728, "lr": 3.67967256137447e-08, "epoch": 19.304624664879356, "percentage": 96.52, "elapsed_time": "4:32:24", "remaining_time": "0:09:48", "throughput": 4086.17, "total_tokens": 66785752} +{"current_steps": 115215, "total_steps": 119360, "loss": 0.1476, "lr": 3.670824211505109e-08, "epoch": 19.305462466487935, "percentage": 96.53, "elapsed_time": "4:32:24", "remaining_time": "0:09:48", "throughput": 4086.17, "total_tokens": 66788440} +{"current_steps": 115220, "total_steps": 119360, "loss": 0.2393, "lr": 3.661986473872226e-08, "epoch": 19.306300268096514, "percentage": 96.53, "elapsed_time": "4:32:25", "remaining_time": "0:09:47", "throughput": 4086.18, "total_tokens": 66791320} +{"current_steps": 115225, "total_steps": 119360, "loss": 0.2272, "lr": 3.653159348664781e-08, "epoch": 19.307138069705093, "percentage": 96.54, "elapsed_time": "4:32:26", "remaining_time": "0:09:46", "throughput": 4086.19, "total_tokens": 66794232} +{"current_steps": 115230, "total_steps": 119360, "loss": 0.2518, "lr": 3.644342836071513e-08, "epoch": 19.307975871313673, "percentage": 96.54, "elapsed_time": "4:32:27", "remaining_time": "0:09:45", "throughput": 4086.2, "total_tokens": 66797336} +{"current_steps": 115235, "total_steps": 119360, "loss": 0.186, "lr": 3.6355369362809926e-08, "epoch": 19.308813672922252, "percentage": 96.54, "elapsed_time": "4:32:27", "remaining_time": "0:09:45", "throughput": 4086.22, "total_tokens": 66800504} +{"current_steps": 115240, "total_steps": 119360, "loss": 0.3579, "lr": 3.6267416494814026e-08, "epoch": 19.30965147453083, "percentage": 96.55, "elapsed_time": "4:32:28", "remaining_time": "0:09:44", "throughput": 4086.23, "total_tokens": 66803448} +{"current_steps": 115245, "total_steps": 119360, "loss": 0.3541, "lr": 3.617956975860815e-08, "epoch": 19.31048927613941, "percentage": 96.55, "elapsed_time": "4:32:29", "remaining_time": "0:09:43", "throughput": 4086.24, "total_tokens": 66806392} +{"current_steps": 115250, "total_steps": 119360, "loss": 0.2685, "lr": 3.6091829156071344e-08, "epoch": 19.31132707774799, "percentage": 96.56, "elapsed_time": "4:32:29", "remaining_time": "0:09:43", "throughput": 4086.25, "total_tokens": 66809304} +{"current_steps": 115255, "total_steps": 119360, "loss": 0.5391, "lr": 3.600419468907934e-08, "epoch": 19.31216487935657, "percentage": 96.56, "elapsed_time": "4:32:30", "remaining_time": "0:09:42", "throughput": 4086.25, "total_tokens": 66812088} +{"current_steps": 115260, "total_steps": 119360, "loss": 0.2056, "lr": 3.5916666359505634e-08, "epoch": 19.31300268096515, "percentage": 96.57, "elapsed_time": "4:32:31", "remaining_time": "0:09:41", "throughput": 4086.26, "total_tokens": 66814776} +{"current_steps": 115265, "total_steps": 119360, "loss": 0.2481, "lr": 3.5829244169221514e-08, "epoch": 19.313840482573728, "percentage": 96.57, "elapsed_time": "4:32:31", "remaining_time": "0:09:40", "throughput": 4086.26, "total_tokens": 66817400} +{"current_steps": 115270, "total_steps": 119360, "loss": 0.2925, "lr": 3.574192812009658e-08, "epoch": 19.314678284182307, "percentage": 96.57, "elapsed_time": "4:32:32", "remaining_time": "0:09:40", "throughput": 4086.27, "total_tokens": 66820504} +{"current_steps": 115275, "total_steps": 119360, "loss": 0.1412, "lr": 3.5654718213997686e-08, "epoch": 19.315516085790886, "percentage": 96.58, "elapsed_time": "4:32:33", "remaining_time": "0:09:39", "throughput": 4086.28, "total_tokens": 66823576} +{"current_steps": 115280, "total_steps": 119360, "loss": 0.6205, "lr": 3.556761445278944e-08, "epoch": 19.316353887399465, "percentage": 96.58, "elapsed_time": "4:32:33", "remaining_time": "0:09:38", "throughput": 4086.3, "total_tokens": 66826520} +{"current_steps": 115285, "total_steps": 119360, "loss": 0.3363, "lr": 3.5480616838334814e-08, "epoch": 19.317191689008045, "percentage": 96.59, "elapsed_time": "4:32:34", "remaining_time": "0:09:38", "throughput": 4086.31, "total_tokens": 66829688} +{"current_steps": 115290, "total_steps": 119360, "loss": 0.1671, "lr": 3.5393725372493413e-08, "epoch": 19.31802949061662, "percentage": 96.59, "elapsed_time": "4:32:35", "remaining_time": "0:09:37", "throughput": 4086.31, "total_tokens": 66832568} +{"current_steps": 115295, "total_steps": 119360, "loss": 0.2728, "lr": 3.530694005712265e-08, "epoch": 19.3188672922252, "percentage": 96.59, "elapsed_time": "4:32:35", "remaining_time": "0:09:36", "throughput": 4086.31, "total_tokens": 66835192} +{"current_steps": 115300, "total_steps": 119360, "loss": 0.2043, "lr": 3.5220260894078815e-08, "epoch": 19.31970509383378, "percentage": 96.6, "elapsed_time": "4:32:36", "remaining_time": "0:09:35", "throughput": 4086.33, "total_tokens": 66838200} +{"current_steps": 115305, "total_steps": 119360, "loss": 0.387, "lr": 3.5133687885214875e-08, "epoch": 19.320542895442358, "percentage": 96.6, "elapsed_time": "4:32:37", "remaining_time": "0:09:35", "throughput": 4086.34, "total_tokens": 66841400} +{"current_steps": 115310, "total_steps": 119360, "loss": 0.2059, "lr": 3.504722103238212e-08, "epoch": 19.321380697050937, "percentage": 96.61, "elapsed_time": "4:32:38", "remaining_time": "0:09:34", "throughput": 4086.36, "total_tokens": 66844728} +{"current_steps": 115315, "total_steps": 119360, "loss": 0.4412, "lr": 3.496086033742907e-08, "epoch": 19.322218498659517, "percentage": 96.61, "elapsed_time": "4:32:38", "remaining_time": "0:09:33", "throughput": 4086.37, "total_tokens": 66847960} +{"current_steps": 115320, "total_steps": 119360, "loss": 0.3644, "lr": 3.4874605802202586e-08, "epoch": 19.323056300268096, "percentage": 96.62, "elapsed_time": "4:32:39", "remaining_time": "0:09:33", "throughput": 4086.38, "total_tokens": 66850808} +{"current_steps": 115325, "total_steps": 119360, "loss": 0.325, "lr": 3.4788457428546754e-08, "epoch": 19.323894101876675, "percentage": 96.62, "elapsed_time": "4:32:40", "remaining_time": "0:09:32", "throughput": 4086.39, "total_tokens": 66853880} +{"current_steps": 115330, "total_steps": 119360, "loss": 0.3476, "lr": 3.4702415218303974e-08, "epoch": 19.324731903485254, "percentage": 96.62, "elapsed_time": "4:32:40", "remaining_time": "0:09:31", "throughput": 4086.4, "total_tokens": 66856696} +{"current_steps": 115335, "total_steps": 119360, "loss": 0.4979, "lr": 3.461647917331279e-08, "epoch": 19.325569705093834, "percentage": 96.63, "elapsed_time": "4:32:41", "remaining_time": "0:09:30", "throughput": 4086.42, "total_tokens": 66859768} +{"current_steps": 115340, "total_steps": 119360, "loss": 0.3001, "lr": 3.4530649295411724e-08, "epoch": 19.326407506702413, "percentage": 96.63, "elapsed_time": "4:32:42", "remaining_time": "0:09:30", "throughput": 4086.43, "total_tokens": 66862584} +{"current_steps": 115345, "total_steps": 119360, "loss": 0.1162, "lr": 3.444492558643542e-08, "epoch": 19.327245308310992, "percentage": 96.64, "elapsed_time": "4:32:42", "remaining_time": "0:09:29", "throughput": 4086.43, "total_tokens": 66865240} +{"current_steps": 115350, "total_steps": 119360, "loss": 0.2321, "lr": 3.4359308048216857e-08, "epoch": 19.32808310991957, "percentage": 96.64, "elapsed_time": "4:32:43", "remaining_time": "0:09:28", "throughput": 4086.44, "total_tokens": 66868152} +{"current_steps": 115355, "total_steps": 119360, "loss": 0.2533, "lr": 3.4273796682587345e-08, "epoch": 19.32892091152815, "percentage": 96.64, "elapsed_time": "4:32:44", "remaining_time": "0:09:28", "throughput": 4086.46, "total_tokens": 66871480} +{"current_steps": 115360, "total_steps": 119360, "loss": 0.3193, "lr": 3.418839149137376e-08, "epoch": 19.32975871313673, "percentage": 96.65, "elapsed_time": "4:32:44", "remaining_time": "0:09:27", "throughput": 4086.46, "total_tokens": 66874104} +{"current_steps": 115365, "total_steps": 119360, "loss": 0.2431, "lr": 3.410309247640353e-08, "epoch": 19.33059651474531, "percentage": 96.65, "elapsed_time": "4:32:45", "remaining_time": "0:09:26", "throughput": 4086.47, "total_tokens": 66877272} +{"current_steps": 115370, "total_steps": 119360, "loss": 0.1322, "lr": 3.40178996395002e-08, "epoch": 19.33143431635389, "percentage": 96.66, "elapsed_time": "4:32:46", "remaining_time": "0:09:26", "throughput": 4086.48, "total_tokens": 66880024} +{"current_steps": 115375, "total_steps": 119360, "loss": 0.1932, "lr": 3.393281298248507e-08, "epoch": 19.332272117962468, "percentage": 96.66, "elapsed_time": "4:32:46", "remaining_time": "0:09:25", "throughput": 4086.49, "total_tokens": 66882968} +{"current_steps": 115380, "total_steps": 119360, "loss": 0.2424, "lr": 3.384783250717727e-08, "epoch": 19.333109919571047, "percentage": 96.67, "elapsed_time": "4:32:47", "remaining_time": "0:09:24", "throughput": 4086.49, "total_tokens": 66885624} +{"current_steps": 115385, "total_steps": 119360, "loss": 0.2041, "lr": 3.3762958215394214e-08, "epoch": 19.333947721179626, "percentage": 96.67, "elapsed_time": "4:32:48", "remaining_time": "0:09:23", "throughput": 4086.51, "total_tokens": 66889208} +{"current_steps": 115390, "total_steps": 119360, "loss": 0.3528, "lr": 3.367819010895057e-08, "epoch": 19.334785522788202, "percentage": 96.67, "elapsed_time": "4:32:48", "remaining_time": "0:09:23", "throughput": 4086.52, "total_tokens": 66892152} +{"current_steps": 115395, "total_steps": 119360, "loss": 0.3182, "lr": 3.359352818965822e-08, "epoch": 19.33562332439678, "percentage": 96.68, "elapsed_time": "4:32:49", "remaining_time": "0:09:22", "throughput": 4086.53, "total_tokens": 66895064} +{"current_steps": 115400, "total_steps": 119360, "loss": 0.336, "lr": 3.350897245932794e-08, "epoch": 19.33646112600536, "percentage": 96.68, "elapsed_time": "4:32:50", "remaining_time": "0:09:21", "throughput": 4086.54, "total_tokens": 66897880} +{"current_steps": 115405, "total_steps": 119360, "loss": 0.3818, "lr": 3.342452291976772e-08, "epoch": 19.33729892761394, "percentage": 96.69, "elapsed_time": "4:32:50", "remaining_time": "0:09:21", "throughput": 4086.55, "total_tokens": 66900728} +{"current_steps": 115410, "total_steps": 119360, "loss": 0.4169, "lr": 3.33401795727828e-08, "epoch": 19.33813672922252, "percentage": 96.69, "elapsed_time": "4:32:51", "remaining_time": "0:09:20", "throughput": 4086.56, "total_tokens": 66903736} +{"current_steps": 115415, "total_steps": 119360, "loss": 0.3044, "lr": 3.325594242017727e-08, "epoch": 19.3389745308311, "percentage": 96.69, "elapsed_time": "4:32:52", "remaining_time": "0:09:19", "throughput": 4086.57, "total_tokens": 66906584} +{"current_steps": 115420, "total_steps": 119360, "loss": 0.2579, "lr": 3.317181146375137e-08, "epoch": 19.339812332439678, "percentage": 96.7, "elapsed_time": "4:32:52", "remaining_time": "0:09:18", "throughput": 4086.58, "total_tokens": 66909496} +{"current_steps": 115425, "total_steps": 119360, "loss": 0.5025, "lr": 3.3087786705304214e-08, "epoch": 19.340650134048257, "percentage": 96.7, "elapsed_time": "4:32:53", "remaining_time": "0:09:18", "throughput": 4086.58, "total_tokens": 66912344} +{"current_steps": 115430, "total_steps": 119360, "loss": 0.4799, "lr": 3.30038681466327e-08, "epoch": 19.341487935656836, "percentage": 96.71, "elapsed_time": "4:32:54", "remaining_time": "0:09:17", "throughput": 4086.59, "total_tokens": 66915288} +{"current_steps": 115435, "total_steps": 119360, "loss": 0.4334, "lr": 3.2920055789530945e-08, "epoch": 19.342325737265416, "percentage": 96.71, "elapsed_time": "4:32:55", "remaining_time": "0:09:16", "throughput": 4086.6, "total_tokens": 66918200} +{"current_steps": 115440, "total_steps": 119360, "loss": 0.2046, "lr": 3.28363496357903e-08, "epoch": 19.343163538873995, "percentage": 96.72, "elapsed_time": "4:32:55", "remaining_time": "0:09:16", "throughput": 4086.6, "total_tokens": 66920888} +{"current_steps": 115445, "total_steps": 119360, "loss": 0.3449, "lr": 3.27527496872021e-08, "epoch": 19.344001340482574, "percentage": 96.72, "elapsed_time": "4:32:56", "remaining_time": "0:09:15", "throughput": 4086.61, "total_tokens": 66923768} +{"current_steps": 115450, "total_steps": 119360, "loss": 0.3661, "lr": 3.2669255945552704e-08, "epoch": 19.344839142091153, "percentage": 96.72, "elapsed_time": "4:32:57", "remaining_time": "0:09:14", "throughput": 4086.63, "total_tokens": 66926904} +{"current_steps": 115455, "total_steps": 119360, "loss": 0.3647, "lr": 3.258586841262679e-08, "epoch": 19.345676943699733, "percentage": 96.73, "elapsed_time": "4:32:57", "remaining_time": "0:09:13", "throughput": 4086.63, "total_tokens": 66929432} +{"current_steps": 115460, "total_steps": 119360, "loss": 0.4302, "lr": 3.2502587090209036e-08, "epoch": 19.346514745308312, "percentage": 96.73, "elapsed_time": "4:32:58", "remaining_time": "0:09:13", "throughput": 4086.64, "total_tokens": 66932312} +{"current_steps": 115465, "total_steps": 119360, "loss": 0.1006, "lr": 3.2419411980078585e-08, "epoch": 19.34735254691689, "percentage": 96.74, "elapsed_time": "4:32:58", "remaining_time": "0:09:12", "throughput": 4086.64, "total_tokens": 66935064} +{"current_steps": 115470, "total_steps": 119360, "loss": 0.3306, "lr": 3.233634308401401e-08, "epoch": 19.34819034852547, "percentage": 96.74, "elapsed_time": "4:32:59", "remaining_time": "0:09:11", "throughput": 4086.65, "total_tokens": 66938008} +{"current_steps": 115475, "total_steps": 119360, "loss": 0.3603, "lr": 3.2253380403792226e-08, "epoch": 19.34902815013405, "percentage": 96.75, "elapsed_time": "4:33:00", "remaining_time": "0:09:11", "throughput": 4086.66, "total_tokens": 66940824} +{"current_steps": 115480, "total_steps": 119360, "loss": 0.1952, "lr": 3.21705239411868e-08, "epoch": 19.34986595174263, "percentage": 96.75, "elapsed_time": "4:33:00", "remaining_time": "0:09:10", "throughput": 4086.67, "total_tokens": 66943576} +{"current_steps": 115485, "total_steps": 119360, "loss": 0.1964, "lr": 3.208777369796912e-08, "epoch": 19.350703753351205, "percentage": 96.75, "elapsed_time": "4:33:01", "remaining_time": "0:09:09", "throughput": 4086.68, "total_tokens": 66946456} +{"current_steps": 115490, "total_steps": 119360, "loss": 0.3274, "lr": 3.200512967590885e-08, "epoch": 19.351541554959784, "percentage": 96.76, "elapsed_time": "4:33:02", "remaining_time": "0:09:08", "throughput": 4086.69, "total_tokens": 66949400} +{"current_steps": 115495, "total_steps": 119360, "loss": 0.3803, "lr": 3.192259187677238e-08, "epoch": 19.352379356568363, "percentage": 96.76, "elapsed_time": "4:33:03", "remaining_time": "0:09:08", "throughput": 4086.7, "total_tokens": 66952536} +{"current_steps": 115500, "total_steps": 119360, "loss": 0.2708, "lr": 3.184016030232495e-08, "epoch": 19.353217158176943, "percentage": 96.77, "elapsed_time": "4:33:03", "remaining_time": "0:09:07", "throughput": 4086.71, "total_tokens": 66955480} +{"current_steps": 115505, "total_steps": 119360, "loss": 0.4246, "lr": 3.1757834954329045e-08, "epoch": 19.354054959785522, "percentage": 96.77, "elapsed_time": "4:33:04", "remaining_time": "0:09:06", "throughput": 4086.72, "total_tokens": 66958488} +{"current_steps": 115510, "total_steps": 119360, "loss": 0.2444, "lr": 3.167561583454493e-08, "epoch": 19.3548927613941, "percentage": 96.77, "elapsed_time": "4:33:05", "remaining_time": "0:09:06", "throughput": 4086.74, "total_tokens": 66961528} +{"current_steps": 115515, "total_steps": 119360, "loss": 0.3655, "lr": 3.159350294473007e-08, "epoch": 19.35573056300268, "percentage": 96.78, "elapsed_time": "4:33:05", "remaining_time": "0:09:05", "throughput": 4086.75, "total_tokens": 66964728} +{"current_steps": 115520, "total_steps": 119360, "loss": 0.324, "lr": 3.1511496286641405e-08, "epoch": 19.35656836461126, "percentage": 96.78, "elapsed_time": "4:33:06", "remaining_time": "0:09:04", "throughput": 4086.76, "total_tokens": 66967704} +{"current_steps": 115525, "total_steps": 119360, "loss": 0.5773, "lr": 3.142959586203087e-08, "epoch": 19.35740616621984, "percentage": 96.79, "elapsed_time": "4:33:07", "remaining_time": "0:09:03", "throughput": 4086.76, "total_tokens": 66970552} +{"current_steps": 115530, "total_steps": 119360, "loss": 0.3251, "lr": 3.134780167265039e-08, "epoch": 19.358243967828418, "percentage": 96.79, "elapsed_time": "4:33:07", "remaining_time": "0:09:03", "throughput": 4086.78, "total_tokens": 66973624} +{"current_steps": 115535, "total_steps": 119360, "loss": 0.41, "lr": 3.126611372024857e-08, "epoch": 19.359081769436997, "percentage": 96.8, "elapsed_time": "4:33:08", "remaining_time": "0:09:02", "throughput": 4086.78, "total_tokens": 66976376} +{"current_steps": 115540, "total_steps": 119360, "loss": 0.4458, "lr": 3.11845320065729e-08, "epoch": 19.359919571045577, "percentage": 96.8, "elapsed_time": "4:33:09", "remaining_time": "0:09:01", "throughput": 4086.78, "total_tokens": 66979096} +{"current_steps": 115545, "total_steps": 119360, "loss": 0.3945, "lr": 3.1103056533366425e-08, "epoch": 19.360757372654156, "percentage": 96.8, "elapsed_time": "4:33:09", "remaining_time": "0:09:01", "throughput": 4086.78, "total_tokens": 66981688} +{"current_steps": 115550, "total_steps": 119360, "loss": 0.5453, "lr": 3.102168730237221e-08, "epoch": 19.361595174262735, "percentage": 96.81, "elapsed_time": "4:33:10", "remaining_time": "0:09:00", "throughput": 4086.8, "total_tokens": 66984888} +{"current_steps": 115555, "total_steps": 119360, "loss": 0.4835, "lr": 3.094042431532884e-08, "epoch": 19.362432975871315, "percentage": 96.81, "elapsed_time": "4:33:11", "remaining_time": "0:08:59", "throughput": 4086.8, "total_tokens": 66987736} +{"current_steps": 115560, "total_steps": 119360, "loss": 0.2948, "lr": 3.085926757397495e-08, "epoch": 19.363270777479894, "percentage": 96.82, "elapsed_time": "4:33:11", "remaining_time": "0:08:59", "throughput": 4086.81, "total_tokens": 66990424} +{"current_steps": 115565, "total_steps": 119360, "loss": 0.2336, "lr": 3.0778217080045804e-08, "epoch": 19.364108579088473, "percentage": 96.82, "elapsed_time": "4:33:12", "remaining_time": "0:08:58", "throughput": 4086.81, "total_tokens": 66993208} +{"current_steps": 115570, "total_steps": 119360, "loss": 0.3283, "lr": 3.069727283527391e-08, "epoch": 19.364946380697052, "percentage": 96.82, "elapsed_time": "4:33:13", "remaining_time": "0:08:57", "throughput": 4086.82, "total_tokens": 66995928} +{"current_steps": 115575, "total_steps": 119360, "loss": 0.3709, "lr": 3.0616434841389544e-08, "epoch": 19.36578418230563, "percentage": 96.83, "elapsed_time": "4:33:13", "remaining_time": "0:08:56", "throughput": 4086.83, "total_tokens": 66998680} +{"current_steps": 115580, "total_steps": 119360, "loss": 0.2326, "lr": 3.0535703100122435e-08, "epoch": 19.36662198391421, "percentage": 96.83, "elapsed_time": "4:33:14", "remaining_time": "0:08:56", "throughput": 4086.84, "total_tokens": 67001464} +{"current_steps": 115585, "total_steps": 119360, "loss": 0.3939, "lr": 3.0455077613197325e-08, "epoch": 19.367459785522787, "percentage": 96.84, "elapsed_time": "4:33:15", "remaining_time": "0:08:55", "throughput": 4086.84, "total_tokens": 67004312} +{"current_steps": 115590, "total_steps": 119360, "loss": 0.5145, "lr": 3.037455838233949e-08, "epoch": 19.368297587131366, "percentage": 96.84, "elapsed_time": "4:33:15", "remaining_time": "0:08:54", "throughput": 4086.85, "total_tokens": 67007256} +{"current_steps": 115595, "total_steps": 119360, "loss": 0.4413, "lr": 3.0294145409269224e-08, "epoch": 19.369135388739945, "percentage": 96.85, "elapsed_time": "4:33:16", "remaining_time": "0:08:54", "throughput": 4086.85, "total_tokens": 67009848} +{"current_steps": 115600, "total_steps": 119360, "loss": 0.1264, "lr": 3.021383869570682e-08, "epoch": 19.369973190348524, "percentage": 96.85, "elapsed_time": "4:33:17", "remaining_time": "0:08:53", "throughput": 4086.87, "total_tokens": 67013080} +{"current_steps": 115605, "total_steps": 119360, "loss": 0.3612, "lr": 3.013363824336868e-08, "epoch": 19.370810991957104, "percentage": 96.85, "elapsed_time": "4:33:17", "remaining_time": "0:08:52", "throughput": 4086.87, "total_tokens": 67015928} +{"current_steps": 115610, "total_steps": 119360, "loss": 0.3363, "lr": 3.005354405397065e-08, "epoch": 19.371648793565683, "percentage": 96.86, "elapsed_time": "4:33:18", "remaining_time": "0:08:51", "throughput": 4086.88, "total_tokens": 67018680} +{"current_steps": 115615, "total_steps": 119360, "loss": 0.4853, "lr": 2.997355612922359e-08, "epoch": 19.372486595174262, "percentage": 96.86, "elapsed_time": "4:33:19", "remaining_time": "0:08:51", "throughput": 4086.89, "total_tokens": 67021784} +{"current_steps": 115620, "total_steps": 119360, "loss": 0.3727, "lr": 2.989367447083946e-08, "epoch": 19.37332439678284, "percentage": 96.87, "elapsed_time": "4:33:19", "remaining_time": "0:08:50", "throughput": 4086.9, "total_tokens": 67024568} +{"current_steps": 115625, "total_steps": 119360, "loss": 0.3076, "lr": 2.9813899080525234e-08, "epoch": 19.37416219839142, "percentage": 96.87, "elapsed_time": "4:33:20", "remaining_time": "0:08:49", "throughput": 4086.91, "total_tokens": 67027608} +{"current_steps": 115630, "total_steps": 119360, "loss": 0.2516, "lr": 2.973422995998676e-08, "epoch": 19.375, "percentage": 96.88, "elapsed_time": "4:33:21", "remaining_time": "0:08:49", "throughput": 4086.92, "total_tokens": 67030424} +{"current_steps": 115635, "total_steps": 119360, "loss": 0.2838, "lr": 2.9654667110927683e-08, "epoch": 19.37583780160858, "percentage": 96.88, "elapsed_time": "4:33:21", "remaining_time": "0:08:48", "throughput": 4086.93, "total_tokens": 67033464} +{"current_steps": 115640, "total_steps": 119360, "loss": 0.3461, "lr": 2.9575210535048858e-08, "epoch": 19.37667560321716, "percentage": 96.88, "elapsed_time": "4:33:22", "remaining_time": "0:08:47", "throughput": 4086.94, "total_tokens": 67036312} +{"current_steps": 115645, "total_steps": 119360, "loss": 0.2291, "lr": 2.949586023404949e-08, "epoch": 19.377513404825738, "percentage": 96.89, "elapsed_time": "4:33:23", "remaining_time": "0:08:46", "throughput": 4086.95, "total_tokens": 67039224} +{"current_steps": 115650, "total_steps": 119360, "loss": 0.483, "lr": 2.9416616209626547e-08, "epoch": 19.378351206434317, "percentage": 96.89, "elapsed_time": "4:33:23", "remaining_time": "0:08:46", "throughput": 4086.96, "total_tokens": 67042136} +{"current_steps": 115655, "total_steps": 119360, "loss": 0.5428, "lr": 2.9337478463474234e-08, "epoch": 19.379189008042896, "percentage": 96.9, "elapsed_time": "4:33:24", "remaining_time": "0:08:45", "throughput": 4086.96, "total_tokens": 67044792} +{"current_steps": 115660, "total_steps": 119360, "loss": 0.2831, "lr": 2.925844699728342e-08, "epoch": 19.380026809651476, "percentage": 96.9, "elapsed_time": "4:33:25", "remaining_time": "0:08:44", "throughput": 4086.97, "total_tokens": 67047576} +{"current_steps": 115665, "total_steps": 119360, "loss": 0.8373, "lr": 2.9179521812745527e-08, "epoch": 19.380864611260055, "percentage": 96.9, "elapsed_time": "4:33:25", "remaining_time": "0:08:44", "throughput": 4086.97, "total_tokens": 67050328} +{"current_steps": 115670, "total_steps": 119360, "loss": 0.3384, "lr": 2.9100702911546985e-08, "epoch": 19.381702412868634, "percentage": 96.91, "elapsed_time": "4:33:26", "remaining_time": "0:08:43", "throughput": 4086.98, "total_tokens": 67053464} +{"current_steps": 115675, "total_steps": 119360, "loss": 0.3385, "lr": 2.902199029537367e-08, "epoch": 19.382540214477213, "percentage": 96.91, "elapsed_time": "4:33:27", "remaining_time": "0:08:42", "throughput": 4087.0, "total_tokens": 67056472} +{"current_steps": 115680, "total_steps": 119360, "loss": 0.5393, "lr": 2.8943383965908677e-08, "epoch": 19.38337801608579, "percentage": 96.92, "elapsed_time": "4:33:27", "remaining_time": "0:08:41", "throughput": 4087.01, "total_tokens": 67059416} +{"current_steps": 115685, "total_steps": 119360, "loss": 0.48, "lr": 2.886488392483233e-08, "epoch": 19.38421581769437, "percentage": 96.92, "elapsed_time": "4:33:28", "remaining_time": "0:08:41", "throughput": 4087.02, "total_tokens": 67062392} +{"current_steps": 115690, "total_steps": 119360, "loss": 0.2711, "lr": 2.8786490173822736e-08, "epoch": 19.385053619302948, "percentage": 96.93, "elapsed_time": "4:33:29", "remaining_time": "0:08:40", "throughput": 4087.03, "total_tokens": 67065496} +{"current_steps": 115695, "total_steps": 119360, "loss": 0.3588, "lr": 2.8708202714556878e-08, "epoch": 19.385891420911527, "percentage": 96.93, "elapsed_time": "4:33:29", "remaining_time": "0:08:39", "throughput": 4087.03, "total_tokens": 67068184} +{"current_steps": 115700, "total_steps": 119360, "loss": 0.1897, "lr": 2.863002154870842e-08, "epoch": 19.386729222520106, "percentage": 96.93, "elapsed_time": "4:33:30", "remaining_time": "0:08:39", "throughput": 4087.05, "total_tokens": 67071160} +{"current_steps": 115705, "total_steps": 119360, "loss": 0.2276, "lr": 2.8551946677948805e-08, "epoch": 19.387567024128685, "percentage": 96.94, "elapsed_time": "4:33:31", "remaining_time": "0:08:38", "throughput": 4087.06, "total_tokens": 67074360} +{"current_steps": 115710, "total_steps": 119360, "loss": 0.1166, "lr": 2.847397810394725e-08, "epoch": 19.388404825737265, "percentage": 96.94, "elapsed_time": "4:33:32", "remaining_time": "0:08:37", "throughput": 4087.07, "total_tokens": 67077432} +{"current_steps": 115715, "total_steps": 119360, "loss": 0.4269, "lr": 2.8396115828371318e-08, "epoch": 19.389242627345844, "percentage": 96.95, "elapsed_time": "4:33:32", "remaining_time": "0:08:37", "throughput": 4087.08, "total_tokens": 67080600} +{"current_steps": 115720, "total_steps": 119360, "loss": 0.4707, "lr": 2.8318359852885225e-08, "epoch": 19.390080428954423, "percentage": 96.95, "elapsed_time": "4:33:33", "remaining_time": "0:08:36", "throughput": 4087.1, "total_tokens": 67083672} +{"current_steps": 115725, "total_steps": 119360, "loss": 0.3949, "lr": 2.8240710179151533e-08, "epoch": 19.390918230563003, "percentage": 96.95, "elapsed_time": "4:33:34", "remaining_time": "0:08:35", "throughput": 4087.12, "total_tokens": 67086968} +{"current_steps": 115730, "total_steps": 119360, "loss": 0.259, "lr": 2.816316680883113e-08, "epoch": 19.391756032171582, "percentage": 96.96, "elapsed_time": "4:33:34", "remaining_time": "0:08:34", "throughput": 4087.13, "total_tokens": 67090008} +{"current_steps": 115735, "total_steps": 119360, "loss": 0.4356, "lr": 2.808572974358159e-08, "epoch": 19.39259383378016, "percentage": 96.96, "elapsed_time": "4:33:35", "remaining_time": "0:08:34", "throughput": 4087.14, "total_tokens": 67092952} +{"current_steps": 115740, "total_steps": 119360, "loss": 0.284, "lr": 2.8008398985058805e-08, "epoch": 19.39343163538874, "percentage": 96.97, "elapsed_time": "4:33:36", "remaining_time": "0:08:33", "throughput": 4087.15, "total_tokens": 67095928} +{"current_steps": 115745, "total_steps": 119360, "loss": 0.3995, "lr": 2.793117453491645e-08, "epoch": 19.39426943699732, "percentage": 96.97, "elapsed_time": "4:33:36", "remaining_time": "0:08:32", "throughput": 4087.15, "total_tokens": 67098616} +{"current_steps": 115750, "total_steps": 119360, "loss": 0.2719, "lr": 2.7854056394804873e-08, "epoch": 19.3951072386059, "percentage": 96.98, "elapsed_time": "4:33:37", "remaining_time": "0:08:32", "throughput": 4087.16, "total_tokens": 67101272} +{"current_steps": 115755, "total_steps": 119360, "loss": 0.2855, "lr": 2.7777044566373314e-08, "epoch": 19.395945040214478, "percentage": 96.98, "elapsed_time": "4:33:38", "remaining_time": "0:08:31", "throughput": 4087.17, "total_tokens": 67104408} +{"current_steps": 115760, "total_steps": 119360, "loss": 0.1851, "lr": 2.7700139051269337e-08, "epoch": 19.396782841823057, "percentage": 96.98, "elapsed_time": "4:33:38", "remaining_time": "0:08:30", "throughput": 4087.18, "total_tokens": 67107320} +{"current_steps": 115765, "total_steps": 119360, "loss": 0.3051, "lr": 2.7623339851135522e-08, "epoch": 19.397620643431637, "percentage": 96.99, "elapsed_time": "4:33:39", "remaining_time": "0:08:29", "throughput": 4087.19, "total_tokens": 67110136} +{"current_steps": 115770, "total_steps": 119360, "loss": 0.4707, "lr": 2.7546646967614997e-08, "epoch": 19.398458445040216, "percentage": 96.99, "elapsed_time": "4:33:40", "remaining_time": "0:08:29", "throughput": 4087.2, "total_tokens": 67113112} +{"current_steps": 115775, "total_steps": 119360, "loss": 0.2898, "lr": 2.747006040234812e-08, "epoch": 19.399296246648795, "percentage": 97.0, "elapsed_time": "4:33:41", "remaining_time": "0:08:28", "throughput": 4087.22, "total_tokens": 67116376} +{"current_steps": 115780, "total_steps": 119360, "loss": 0.4041, "lr": 2.7393580156971357e-08, "epoch": 19.40013404825737, "percentage": 97.0, "elapsed_time": "4:33:41", "remaining_time": "0:08:27", "throughput": 4087.23, "total_tokens": 67119512} +{"current_steps": 115785, "total_steps": 119360, "loss": 0.2952, "lr": 2.7317206233120618e-08, "epoch": 19.40097184986595, "percentage": 97.0, "elapsed_time": "4:33:42", "remaining_time": "0:08:27", "throughput": 4087.24, "total_tokens": 67122456} +{"current_steps": 115790, "total_steps": 119360, "loss": 0.4568, "lr": 2.7240938632428493e-08, "epoch": 19.40180965147453, "percentage": 97.01, "elapsed_time": "4:33:43", "remaining_time": "0:08:26", "throughput": 4087.25, "total_tokens": 67125528} +{"current_steps": 115795, "total_steps": 119360, "loss": 0.337, "lr": 2.716477735652645e-08, "epoch": 19.40264745308311, "percentage": 97.01, "elapsed_time": "4:33:43", "remaining_time": "0:08:25", "throughput": 4087.27, "total_tokens": 67128504} +{"current_steps": 115800, "total_steps": 119360, "loss": 0.3023, "lr": 2.7088722407041523e-08, "epoch": 19.403485254691688, "percentage": 97.02, "elapsed_time": "4:33:44", "remaining_time": "0:08:24", "throughput": 4087.28, "total_tokens": 67131320} +{"current_steps": 115805, "total_steps": 119360, "loss": 0.3714, "lr": 2.70127737856013e-08, "epoch": 19.404323056300267, "percentage": 97.02, "elapsed_time": "4:33:45", "remaining_time": "0:08:24", "throughput": 4087.28, "total_tokens": 67133848} +{"current_steps": 115810, "total_steps": 119360, "loss": 0.4032, "lr": 2.6936931493828367e-08, "epoch": 19.405160857908847, "percentage": 97.03, "elapsed_time": "4:33:45", "remaining_time": "0:08:23", "throughput": 4087.28, "total_tokens": 67136440} +{"current_steps": 115815, "total_steps": 119360, "loss": 0.2752, "lr": 2.6861195533345873e-08, "epoch": 19.405998659517426, "percentage": 97.03, "elapsed_time": "4:33:46", "remaining_time": "0:08:22", "throughput": 4087.29, "total_tokens": 67139512} +{"current_steps": 115820, "total_steps": 119360, "loss": 0.3686, "lr": 2.6785565905771972e-08, "epoch": 19.406836461126005, "percentage": 97.03, "elapsed_time": "4:33:47", "remaining_time": "0:08:22", "throughput": 4087.29, "total_tokens": 67142232} +{"current_steps": 115825, "total_steps": 119360, "loss": 0.6221, "lr": 2.671004261272425e-08, "epoch": 19.407674262734584, "percentage": 97.04, "elapsed_time": "4:33:47", "remaining_time": "0:08:21", "throughput": 4087.3, "total_tokens": 67145112} +{"current_steps": 115830, "total_steps": 119360, "loss": 0.599, "lr": 2.6634625655816983e-08, "epoch": 19.408512064343164, "percentage": 97.04, "elapsed_time": "4:33:48", "remaining_time": "0:08:20", "throughput": 4087.31, "total_tokens": 67147800} +{"current_steps": 115835, "total_steps": 119360, "loss": 0.4675, "lr": 2.6559315036663313e-08, "epoch": 19.409349865951743, "percentage": 97.05, "elapsed_time": "4:33:49", "remaining_time": "0:08:19", "throughput": 4087.31, "total_tokens": 67150488} +{"current_steps": 115840, "total_steps": 119360, "loss": 0.2642, "lr": 2.6484110756873072e-08, "epoch": 19.410187667560322, "percentage": 97.05, "elapsed_time": "4:33:49", "remaining_time": "0:08:19", "throughput": 4087.32, "total_tokens": 67153592} +{"current_steps": 115845, "total_steps": 119360, "loss": 0.4818, "lr": 2.6409012818054414e-08, "epoch": 19.4110254691689, "percentage": 97.06, "elapsed_time": "4:33:50", "remaining_time": "0:08:18", "throughput": 4087.33, "total_tokens": 67156344} +{"current_steps": 115850, "total_steps": 119360, "loss": 0.3751, "lr": 2.633402122181328e-08, "epoch": 19.41186327077748, "percentage": 97.06, "elapsed_time": "4:33:51", "remaining_time": "0:08:17", "throughput": 4087.33, "total_tokens": 67159032} +{"current_steps": 115855, "total_steps": 119360, "loss": 0.4669, "lr": 2.6259135969752825e-08, "epoch": 19.41270107238606, "percentage": 97.06, "elapsed_time": "4:33:51", "remaining_time": "0:08:17", "throughput": 4087.34, "total_tokens": 67161848} +{"current_steps": 115860, "total_steps": 119360, "loss": 0.2087, "lr": 2.6184357063473998e-08, "epoch": 19.41353887399464, "percentage": 97.07, "elapsed_time": "4:33:52", "remaining_time": "0:08:16", "throughput": 4087.34, "total_tokens": 67164600} +{"current_steps": 115865, "total_steps": 119360, "loss": 0.4032, "lr": 2.6109684504576625e-08, "epoch": 19.41437667560322, "percentage": 97.07, "elapsed_time": "4:33:53", "remaining_time": "0:08:15", "throughput": 4087.36, "total_tokens": 67167672} +{"current_steps": 115870, "total_steps": 119360, "loss": 0.2563, "lr": 2.6035118294655547e-08, "epoch": 19.415214477211798, "percentage": 97.08, "elapsed_time": "4:33:53", "remaining_time": "0:08:14", "throughput": 4087.37, "total_tokens": 67171000} +{"current_steps": 115875, "total_steps": 119360, "loss": 0.3215, "lr": 2.5960658435306706e-08, "epoch": 19.416052278820374, "percentage": 97.08, "elapsed_time": "4:33:54", "remaining_time": "0:08:14", "throughput": 4087.38, "total_tokens": 67173880} +{"current_steps": 115880, "total_steps": 119360, "loss": 0.212, "lr": 2.5886304928121607e-08, "epoch": 19.416890080428953, "percentage": 97.08, "elapsed_time": "4:33:55", "remaining_time": "0:08:13", "throughput": 4087.39, "total_tokens": 67176728} +{"current_steps": 115885, "total_steps": 119360, "loss": 0.4082, "lr": 2.581205777469009e-08, "epoch": 19.417727882037532, "percentage": 97.09, "elapsed_time": "4:33:55", "remaining_time": "0:08:12", "throughput": 4087.4, "total_tokens": 67179544} +{"current_steps": 115890, "total_steps": 119360, "loss": 0.4449, "lr": 2.5737916976599774e-08, "epoch": 19.41856568364611, "percentage": 97.09, "elapsed_time": "4:33:56", "remaining_time": "0:08:12", "throughput": 4087.4, "total_tokens": 67182392} +{"current_steps": 115895, "total_steps": 119360, "loss": 0.1939, "lr": 2.5663882535434946e-08, "epoch": 19.41940348525469, "percentage": 97.1, "elapsed_time": "4:33:57", "remaining_time": "0:08:11", "throughput": 4087.41, "total_tokens": 67185432} +{"current_steps": 115900, "total_steps": 119360, "loss": 0.3743, "lr": 2.5589954452779898e-08, "epoch": 19.42024128686327, "percentage": 97.1, "elapsed_time": "4:33:57", "remaining_time": "0:08:10", "throughput": 4087.42, "total_tokens": 67188312} +{"current_steps": 115905, "total_steps": 119360, "loss": 0.17, "lr": 2.5516132730215028e-08, "epoch": 19.42107908847185, "percentage": 97.11, "elapsed_time": "4:33:58", "remaining_time": "0:08:10", "throughput": 4087.44, "total_tokens": 67191512} +{"current_steps": 115910, "total_steps": 119360, "loss": 0.2506, "lr": 2.5442417369318516e-08, "epoch": 19.42191689008043, "percentage": 97.11, "elapsed_time": "4:33:59", "remaining_time": "0:08:09", "throughput": 4087.44, "total_tokens": 67194424} +{"current_steps": 115915, "total_steps": 119360, "loss": 0.3262, "lr": 2.5368808371665777e-08, "epoch": 19.422754691689008, "percentage": 97.11, "elapsed_time": "4:33:59", "remaining_time": "0:08:08", "throughput": 4087.45, "total_tokens": 67197400} +{"current_steps": 115920, "total_steps": 119360, "loss": 0.2583, "lr": 2.529530573883221e-08, "epoch": 19.423592493297587, "percentage": 97.12, "elapsed_time": "4:34:00", "remaining_time": "0:08:07", "throughput": 4087.46, "total_tokens": 67200024} +{"current_steps": 115925, "total_steps": 119360, "loss": 0.3568, "lr": 2.522190947238823e-08, "epoch": 19.424430294906166, "percentage": 97.12, "elapsed_time": "4:34:01", "remaining_time": "0:08:07", "throughput": 4087.47, "total_tokens": 67202872} +{"current_steps": 115930, "total_steps": 119360, "loss": 0.1837, "lr": 2.5148619573903686e-08, "epoch": 19.425268096514746, "percentage": 97.13, "elapsed_time": "4:34:01", "remaining_time": "0:08:06", "throughput": 4087.47, "total_tokens": 67205560} +{"current_steps": 115935, "total_steps": 119360, "loss": 0.3899, "lr": 2.507543604494511e-08, "epoch": 19.426105898123325, "percentage": 97.13, "elapsed_time": "4:34:02", "remaining_time": "0:08:05", "throughput": 4087.48, "total_tokens": 67208440} +{"current_steps": 115940, "total_steps": 119360, "loss": 0.3881, "lr": 2.5002358887077915e-08, "epoch": 19.426943699731904, "percentage": 97.13, "elapsed_time": "4:34:03", "remaining_time": "0:08:05", "throughput": 4087.49, "total_tokens": 67211256} +{"current_steps": 115945, "total_steps": 119360, "loss": 0.3612, "lr": 2.492938810186418e-08, "epoch": 19.427781501340483, "percentage": 97.14, "elapsed_time": "4:34:03", "remaining_time": "0:08:04", "throughput": 4087.5, "total_tokens": 67214264} +{"current_steps": 115950, "total_steps": 119360, "loss": 0.1644, "lr": 2.485652369086433e-08, "epoch": 19.428619302949063, "percentage": 97.14, "elapsed_time": "4:34:04", "remaining_time": "0:08:03", "throughput": 4087.5, "total_tokens": 67216920} +{"current_steps": 115955, "total_steps": 119360, "loss": 0.3503, "lr": 2.4783765655636006e-08, "epoch": 19.429457104557642, "percentage": 97.15, "elapsed_time": "4:34:05", "remaining_time": "0:08:02", "throughput": 4087.51, "total_tokens": 67219736} +{"current_steps": 115960, "total_steps": 119360, "loss": 0.2933, "lr": 2.471111399773518e-08, "epoch": 19.43029490616622, "percentage": 97.15, "elapsed_time": "4:34:05", "remaining_time": "0:08:02", "throughput": 4087.51, "total_tokens": 67222552} +{"current_steps": 115965, "total_steps": 119360, "loss": 0.4363, "lr": 2.4638568718715616e-08, "epoch": 19.4311327077748, "percentage": 97.16, "elapsed_time": "4:34:06", "remaining_time": "0:08:01", "throughput": 4087.52, "total_tokens": 67225368} +{"current_steps": 115970, "total_steps": 119360, "loss": 0.2173, "lr": 2.4566129820127738e-08, "epoch": 19.43197050938338, "percentage": 97.16, "elapsed_time": "4:34:07", "remaining_time": "0:08:00", "throughput": 4087.52, "total_tokens": 67227896} +{"current_steps": 115975, "total_steps": 119360, "loss": 0.2927, "lr": 2.4493797303520306e-08, "epoch": 19.432808310991955, "percentage": 97.16, "elapsed_time": "4:34:07", "remaining_time": "0:08:00", "throughput": 4087.53, "total_tokens": 67230680} +{"current_steps": 115980, "total_steps": 119360, "loss": 0.4325, "lr": 2.4421571170440417e-08, "epoch": 19.433646112600535, "percentage": 97.17, "elapsed_time": "4:34:08", "remaining_time": "0:07:59", "throughput": 4087.54, "total_tokens": 67233688} +{"current_steps": 115985, "total_steps": 119360, "loss": 0.2883, "lr": 2.434945142243239e-08, "epoch": 19.434483914209114, "percentage": 97.17, "elapsed_time": "4:34:09", "remaining_time": "0:07:58", "throughput": 4087.55, "total_tokens": 67236376} +{"current_steps": 115990, "total_steps": 119360, "loss": 0.2603, "lr": 2.4277438061037773e-08, "epoch": 19.435321715817693, "percentage": 97.18, "elapsed_time": "4:34:09", "remaining_time": "0:07:57", "throughput": 4087.56, "total_tokens": 67239352} +{"current_steps": 115995, "total_steps": 119360, "loss": 0.2448, "lr": 2.4205531087796442e-08, "epoch": 19.436159517426272, "percentage": 97.18, "elapsed_time": "4:34:10", "remaining_time": "0:07:57", "throughput": 4087.57, "total_tokens": 67242424} +{"current_steps": 116000, "total_steps": 119360, "loss": 0.4737, "lr": 2.413373050424661e-08, "epoch": 19.43699731903485, "percentage": 97.18, "elapsed_time": "4:34:11", "remaining_time": "0:07:56", "throughput": 4087.59, "total_tokens": 67245464} +{"current_steps": 116005, "total_steps": 119360, "loss": 0.497, "lr": 2.4062036311922608e-08, "epoch": 19.43783512064343, "percentage": 97.19, "elapsed_time": "4:34:11", "remaining_time": "0:07:55", "throughput": 4087.59, "total_tokens": 67248344} +{"current_steps": 116010, "total_steps": 119360, "loss": 0.1107, "lr": 2.3990448512357656e-08, "epoch": 19.43867292225201, "percentage": 97.19, "elapsed_time": "4:34:12", "remaining_time": "0:07:55", "throughput": 4087.6, "total_tokens": 67251256} +{"current_steps": 116015, "total_steps": 119360, "loss": 0.3788, "lr": 2.3918967107082193e-08, "epoch": 19.43951072386059, "percentage": 97.2, "elapsed_time": "4:34:13", "remaining_time": "0:07:54", "throughput": 4087.61, "total_tokens": 67254136} +{"current_steps": 116020, "total_steps": 119360, "loss": 0.2789, "lr": 2.3847592097624993e-08, "epoch": 19.44034852546917, "percentage": 97.2, "elapsed_time": "4:34:13", "remaining_time": "0:07:53", "throughput": 4087.61, "total_tokens": 67256920} +{"current_steps": 116025, "total_steps": 119360, "loss": 0.4161, "lr": 2.3776323485512063e-08, "epoch": 19.441186327077748, "percentage": 97.21, "elapsed_time": "4:34:14", "remaining_time": "0:07:52", "throughput": 4087.63, "total_tokens": 67260024} +{"current_steps": 116030, "total_steps": 119360, "loss": 0.2137, "lr": 2.3705161272267185e-08, "epoch": 19.442024128686327, "percentage": 97.21, "elapsed_time": "4:34:15", "remaining_time": "0:07:52", "throughput": 4087.63, "total_tokens": 67262904} +{"current_steps": 116035, "total_steps": 119360, "loss": 0.5264, "lr": 2.363410545941136e-08, "epoch": 19.442861930294907, "percentage": 97.21, "elapsed_time": "4:34:15", "remaining_time": "0:07:51", "throughput": 4087.64, "total_tokens": 67265560} +{"current_steps": 116040, "total_steps": 119360, "loss": 0.4714, "lr": 2.3563156048464486e-08, "epoch": 19.443699731903486, "percentage": 97.22, "elapsed_time": "4:34:16", "remaining_time": "0:07:50", "throughput": 4087.65, "total_tokens": 67268472} +{"current_steps": 116045, "total_steps": 119360, "loss": 0.3068, "lr": 2.349231304094368e-08, "epoch": 19.444537533512065, "percentage": 97.22, "elapsed_time": "4:34:17", "remaining_time": "0:07:50", "throughput": 4087.66, "total_tokens": 67271288} +{"current_steps": 116050, "total_steps": 119360, "loss": 0.3331, "lr": 2.342157643836329e-08, "epoch": 19.445375335120644, "percentage": 97.23, "elapsed_time": "4:34:17", "remaining_time": "0:07:49", "throughput": 4087.66, "total_tokens": 67273912} +{"current_steps": 116055, "total_steps": 119360, "loss": 0.4192, "lr": 2.3350946242235995e-08, "epoch": 19.446213136729224, "percentage": 97.23, "elapsed_time": "4:34:18", "remaining_time": "0:07:48", "throughput": 4087.67, "total_tokens": 67276728} +{"current_steps": 116060, "total_steps": 119360, "loss": 0.4845, "lr": 2.3280422454071695e-08, "epoch": 19.447050938337803, "percentage": 97.24, "elapsed_time": "4:34:19", "remaining_time": "0:07:47", "throughput": 4087.68, "total_tokens": 67279544} +{"current_steps": 116065, "total_steps": 119360, "loss": 0.422, "lr": 2.321000507537863e-08, "epoch": 19.447888739946382, "percentage": 97.24, "elapsed_time": "4:34:19", "remaining_time": "0:07:47", "throughput": 4087.68, "total_tokens": 67282328} +{"current_steps": 116070, "total_steps": 119360, "loss": 0.4195, "lr": 2.3139694107662258e-08, "epoch": 19.44872654155496, "percentage": 97.24, "elapsed_time": "4:34:20", "remaining_time": "0:07:46", "throughput": 4087.69, "total_tokens": 67285048} +{"current_steps": 116075, "total_steps": 119360, "loss": 0.4386, "lr": 2.306948955242583e-08, "epoch": 19.449564343163537, "percentage": 97.25, "elapsed_time": "4:34:21", "remaining_time": "0:07:45", "throughput": 4087.69, "total_tokens": 67287768} +{"current_steps": 116080, "total_steps": 119360, "loss": 0.3049, "lr": 2.2999391411170358e-08, "epoch": 19.450402144772116, "percentage": 97.25, "elapsed_time": "4:34:21", "remaining_time": "0:07:45", "throughput": 4087.7, "total_tokens": 67290712} +{"current_steps": 116085, "total_steps": 119360, "loss": 0.2024, "lr": 2.2929399685395203e-08, "epoch": 19.451239946380696, "percentage": 97.26, "elapsed_time": "4:34:22", "remaining_time": "0:07:44", "throughput": 4087.71, "total_tokens": 67293592} +{"current_steps": 116090, "total_steps": 119360, "loss": 0.3548, "lr": 2.2859514376596392e-08, "epoch": 19.452077747989275, "percentage": 97.26, "elapsed_time": "4:34:23", "remaining_time": "0:07:43", "throughput": 4087.72, "total_tokens": 67296440} +{"current_steps": 116095, "total_steps": 119360, "loss": 0.1583, "lr": 2.2789735486268283e-08, "epoch": 19.452915549597854, "percentage": 97.26, "elapsed_time": "4:34:23", "remaining_time": "0:07:43", "throughput": 4087.73, "total_tokens": 67299352} +{"current_steps": 116100, "total_steps": 119360, "loss": 0.1752, "lr": 2.272006301590246e-08, "epoch": 19.453753351206434, "percentage": 97.27, "elapsed_time": "4:34:24", "remaining_time": "0:07:42", "throughput": 4087.75, "total_tokens": 67302296} +{"current_steps": 116105, "total_steps": 119360, "loss": 0.391, "lr": 2.26504969669894e-08, "epoch": 19.454591152815013, "percentage": 97.27, "elapsed_time": "4:34:25", "remaining_time": "0:07:41", "throughput": 4087.76, "total_tokens": 67305240} +{"current_steps": 116110, "total_steps": 119360, "loss": 0.3118, "lr": 2.2581037341016243e-08, "epoch": 19.455428954423592, "percentage": 97.28, "elapsed_time": "4:34:25", "remaining_time": "0:07:40", "throughput": 4087.77, "total_tokens": 67308504} +{"current_steps": 116115, "total_steps": 119360, "loss": 0.1645, "lr": 2.2511684139467914e-08, "epoch": 19.45626675603217, "percentage": 97.28, "elapsed_time": "4:34:26", "remaining_time": "0:07:40", "throughput": 4087.78, "total_tokens": 67311608} +{"current_steps": 116120, "total_steps": 119360, "loss": 0.3366, "lr": 2.2442437363827118e-08, "epoch": 19.45710455764075, "percentage": 97.29, "elapsed_time": "4:34:27", "remaining_time": "0:07:39", "throughput": 4087.8, "total_tokens": 67314648} +{"current_steps": 116125, "total_steps": 119360, "loss": 0.3553, "lr": 2.237329701557489e-08, "epoch": 19.45794235924933, "percentage": 97.29, "elapsed_time": "4:34:27", "remaining_time": "0:07:38", "throughput": 4087.8, "total_tokens": 67317496} +{"current_steps": 116130, "total_steps": 119360, "loss": 0.2287, "lr": 2.2304263096189495e-08, "epoch": 19.45878016085791, "percentage": 97.29, "elapsed_time": "4:34:28", "remaining_time": "0:07:38", "throughput": 4087.82, "total_tokens": 67320376} +{"current_steps": 116135, "total_steps": 119360, "loss": 0.3296, "lr": 2.2235335607146968e-08, "epoch": 19.45961796246649, "percentage": 97.3, "elapsed_time": "4:34:29", "remaining_time": "0:07:37", "throughput": 4087.83, "total_tokens": 67323288} +{"current_steps": 116140, "total_steps": 119360, "loss": 0.2797, "lr": 2.216651454992058e-08, "epoch": 19.460455764075068, "percentage": 97.3, "elapsed_time": "4:34:29", "remaining_time": "0:07:36", "throughput": 4087.83, "total_tokens": 67326040} +{"current_steps": 116145, "total_steps": 119360, "loss": 0.4978, "lr": 2.209779992598249e-08, "epoch": 19.461293565683647, "percentage": 97.31, "elapsed_time": "4:34:30", "remaining_time": "0:07:35", "throughput": 4087.85, "total_tokens": 67329080} +{"current_steps": 116150, "total_steps": 119360, "loss": 0.3168, "lr": 2.2029191736801515e-08, "epoch": 19.462131367292226, "percentage": 97.31, "elapsed_time": "4:34:31", "remaining_time": "0:07:35", "throughput": 4087.86, "total_tokens": 67332056} +{"current_steps": 116155, "total_steps": 119360, "loss": 0.2384, "lr": 2.196068998384482e-08, "epoch": 19.462969168900806, "percentage": 97.31, "elapsed_time": "4:34:31", "remaining_time": "0:07:34", "throughput": 4087.87, "total_tokens": 67334968} +{"current_steps": 116160, "total_steps": 119360, "loss": 0.2086, "lr": 2.1892294668576786e-08, "epoch": 19.463806970509385, "percentage": 97.32, "elapsed_time": "4:34:32", "remaining_time": "0:07:33", "throughput": 4087.87, "total_tokens": 67337816} +{"current_steps": 116165, "total_steps": 119360, "loss": 0.4133, "lr": 2.1824005792460688e-08, "epoch": 19.464644772117964, "percentage": 97.32, "elapsed_time": "4:34:33", "remaining_time": "0:07:33", "throughput": 4087.88, "total_tokens": 67340504} +{"current_steps": 116170, "total_steps": 119360, "loss": 0.5788, "lr": 2.1755823356955364e-08, "epoch": 19.46548257372654, "percentage": 97.33, "elapsed_time": "4:34:33", "remaining_time": "0:07:32", "throughput": 4087.89, "total_tokens": 67343672} +{"current_steps": 116175, "total_steps": 119360, "loss": 0.3066, "lr": 2.168774736351964e-08, "epoch": 19.46632037533512, "percentage": 97.33, "elapsed_time": "4:34:34", "remaining_time": "0:07:31", "throughput": 4087.89, "total_tokens": 67346424} +{"current_steps": 116180, "total_steps": 119360, "loss": 0.4328, "lr": 2.1619777813608467e-08, "epoch": 19.4671581769437, "percentage": 97.34, "elapsed_time": "4:34:35", "remaining_time": "0:07:30", "throughput": 4087.9, "total_tokens": 67349496} +{"current_steps": 116185, "total_steps": 119360, "loss": 0.291, "lr": 2.1551914708675127e-08, "epoch": 19.467995978552278, "percentage": 97.34, "elapsed_time": "4:34:35", "remaining_time": "0:07:30", "throughput": 4087.91, "total_tokens": 67352376} +{"current_steps": 116190, "total_steps": 119360, "loss": 0.4901, "lr": 2.1484158050171234e-08, "epoch": 19.468833780160857, "percentage": 97.34, "elapsed_time": "4:34:36", "remaining_time": "0:07:29", "throughput": 4087.91, "total_tokens": 67354840} +{"current_steps": 116195, "total_steps": 119360, "loss": 0.3652, "lr": 2.1416507839545074e-08, "epoch": 19.469671581769436, "percentage": 97.35, "elapsed_time": "4:34:37", "remaining_time": "0:07:28", "throughput": 4087.92, "total_tokens": 67357752} +{"current_steps": 116200, "total_steps": 119360, "loss": 0.4674, "lr": 2.1348964078242716e-08, "epoch": 19.470509383378015, "percentage": 97.35, "elapsed_time": "4:34:37", "remaining_time": "0:07:28", "throughput": 4087.93, "total_tokens": 67360664} +{"current_steps": 116205, "total_steps": 119360, "loss": 0.5302, "lr": 2.1281526767709115e-08, "epoch": 19.471347184986595, "percentage": 97.36, "elapsed_time": "4:34:38", "remaining_time": "0:07:27", "throughput": 4087.94, "total_tokens": 67363800} +{"current_steps": 116210, "total_steps": 119360, "loss": 0.2432, "lr": 2.1214195909386447e-08, "epoch": 19.472184986595174, "percentage": 97.36, "elapsed_time": "4:34:39", "remaining_time": "0:07:26", "throughput": 4087.95, "total_tokens": 67366744} +{"current_steps": 116215, "total_steps": 119360, "loss": 0.3948, "lr": 2.114697150471301e-08, "epoch": 19.473022788203753, "percentage": 97.37, "elapsed_time": "4:34:40", "remaining_time": "0:07:25", "throughput": 4087.95, "total_tokens": 67369528} +{"current_steps": 116220, "total_steps": 119360, "loss": 0.4842, "lr": 2.1079853555127093e-08, "epoch": 19.473860589812332, "percentage": 97.37, "elapsed_time": "4:34:40", "remaining_time": "0:07:25", "throughput": 4087.95, "total_tokens": 67372152} +{"current_steps": 116225, "total_steps": 119360, "loss": 0.3139, "lr": 2.1012842062063666e-08, "epoch": 19.47469839142091, "percentage": 97.37, "elapsed_time": "4:34:41", "remaining_time": "0:07:24", "throughput": 4087.96, "total_tokens": 67374872} +{"current_steps": 116230, "total_steps": 119360, "loss": 0.2252, "lr": 2.0945937026955465e-08, "epoch": 19.47553619302949, "percentage": 97.38, "elapsed_time": "4:34:41", "remaining_time": "0:07:23", "throughput": 4087.96, "total_tokens": 67377752} +{"current_steps": 116235, "total_steps": 119360, "loss": 0.2651, "lr": 2.0879138451233015e-08, "epoch": 19.47637399463807, "percentage": 97.38, "elapsed_time": "4:34:42", "remaining_time": "0:07:23", "throughput": 4087.98, "total_tokens": 67381016} +{"current_steps": 116240, "total_steps": 119360, "loss": 0.2316, "lr": 2.081244633632462e-08, "epoch": 19.47721179624665, "percentage": 97.39, "elapsed_time": "4:34:43", "remaining_time": "0:07:22", "throughput": 4087.99, "total_tokens": 67383864} +{"current_steps": 116245, "total_steps": 119360, "loss": 0.6241, "lr": 2.074586068365636e-08, "epoch": 19.47804959785523, "percentage": 97.39, "elapsed_time": "4:34:44", "remaining_time": "0:07:21", "throughput": 4088.0, "total_tokens": 67386776} +{"current_steps": 116250, "total_steps": 119360, "loss": 0.3329, "lr": 2.067938149465154e-08, "epoch": 19.478887399463808, "percentage": 97.39, "elapsed_time": "4:34:44", "remaining_time": "0:07:21", "throughput": 4088.0, "total_tokens": 67389528} +{"current_steps": 116255, "total_steps": 119360, "loss": 0.1852, "lr": 2.0613008770731802e-08, "epoch": 19.479725201072387, "percentage": 97.4, "elapsed_time": "4:34:45", "remaining_time": "0:07:20", "throughput": 4088.01, "total_tokens": 67392376} +{"current_steps": 116260, "total_steps": 119360, "loss": 0.3278, "lr": 2.0546742513316563e-08, "epoch": 19.480563002680967, "percentage": 97.4, "elapsed_time": "4:34:46", "remaining_time": "0:07:19", "throughput": 4088.02, "total_tokens": 67395224} +{"current_steps": 116265, "total_steps": 119360, "loss": 0.2361, "lr": 2.048058272382192e-08, "epoch": 19.481400804289546, "percentage": 97.41, "elapsed_time": "4:34:46", "remaining_time": "0:07:18", "throughput": 4088.03, "total_tokens": 67398168} +{"current_steps": 116270, "total_steps": 119360, "loss": 0.479, "lr": 2.0414529403663398e-08, "epoch": 19.48223860589812, "percentage": 97.41, "elapsed_time": "4:34:47", "remaining_time": "0:07:18", "throughput": 4088.04, "total_tokens": 67401176} +{"current_steps": 116275, "total_steps": 119360, "loss": 0.405, "lr": 2.034858255425265e-08, "epoch": 19.4830764075067, "percentage": 97.42, "elapsed_time": "4:34:48", "remaining_time": "0:07:17", "throughput": 4088.04, "total_tokens": 67404024} +{"current_steps": 116280, "total_steps": 119360, "loss": 0.4123, "lr": 2.0282742177000214e-08, "epoch": 19.48391420911528, "percentage": 97.42, "elapsed_time": "4:34:48", "remaining_time": "0:07:16", "throughput": 4088.06, "total_tokens": 67406968} +{"current_steps": 116285, "total_steps": 119360, "loss": 0.4535, "lr": 2.02170082733133e-08, "epoch": 19.48475201072386, "percentage": 97.42, "elapsed_time": "4:34:49", "remaining_time": "0:07:16", "throughput": 4088.06, "total_tokens": 67409784} +{"current_steps": 116290, "total_steps": 119360, "loss": 0.2294, "lr": 2.0151380844598e-08, "epoch": 19.48558981233244, "percentage": 97.43, "elapsed_time": "4:34:50", "remaining_time": "0:07:15", "throughput": 4088.07, "total_tokens": 67412696} +{"current_steps": 116295, "total_steps": 119360, "loss": 0.1711, "lr": 2.008585989225709e-08, "epoch": 19.486427613941018, "percentage": 97.43, "elapsed_time": "4:34:50", "remaining_time": "0:07:14", "throughput": 4088.08, "total_tokens": 67415736} +{"current_steps": 116300, "total_steps": 119360, "loss": 0.5875, "lr": 2.002044541769166e-08, "epoch": 19.487265415549597, "percentage": 97.44, "elapsed_time": "4:34:51", "remaining_time": "0:07:13", "throughput": 4088.09, "total_tokens": 67418648} +{"current_steps": 116305, "total_steps": 119360, "loss": 0.46, "lr": 1.995513742230004e-08, "epoch": 19.488103217158177, "percentage": 97.44, "elapsed_time": "4:34:52", "remaining_time": "0:07:13", "throughput": 4088.09, "total_tokens": 67421368} +{"current_steps": 116310, "total_steps": 119360, "loss": 0.1437, "lr": 1.9889935907478896e-08, "epoch": 19.488941018766756, "percentage": 97.44, "elapsed_time": "4:34:52", "remaining_time": "0:07:12", "throughput": 4088.11, "total_tokens": 67424504} +{"current_steps": 116315, "total_steps": 119360, "loss": 0.3282, "lr": 1.9824840874622662e-08, "epoch": 19.489778820375335, "percentage": 97.45, "elapsed_time": "4:34:53", "remaining_time": "0:07:11", "throughput": 4088.11, "total_tokens": 67427384} +{"current_steps": 116320, "total_steps": 119360, "loss": 0.2248, "lr": 1.9759852325123008e-08, "epoch": 19.490616621983914, "percentage": 97.45, "elapsed_time": "4:34:54", "remaining_time": "0:07:11", "throughput": 4088.12, "total_tokens": 67430232} +{"current_steps": 116325, "total_steps": 119360, "loss": 0.3273, "lr": 1.9694970260368818e-08, "epoch": 19.491454423592494, "percentage": 97.46, "elapsed_time": "4:34:54", "remaining_time": "0:07:10", "throughput": 4088.13, "total_tokens": 67433016} +{"current_steps": 116330, "total_steps": 119360, "loss": 0.2634, "lr": 1.9630194681748427e-08, "epoch": 19.492292225201073, "percentage": 97.46, "elapsed_time": "4:34:55", "remaining_time": "0:07:09", "throughput": 4088.14, "total_tokens": 67435800} +{"current_steps": 116335, "total_steps": 119360, "loss": 0.3997, "lr": 1.9565525590645728e-08, "epoch": 19.493130026809652, "percentage": 97.47, "elapsed_time": "4:34:56", "remaining_time": "0:07:08", "throughput": 4088.16, "total_tokens": 67439128} +{"current_steps": 116340, "total_steps": 119360, "loss": 0.207, "lr": 1.950096298844406e-08, "epoch": 19.49396782841823, "percentage": 97.47, "elapsed_time": "4:34:56", "remaining_time": "0:07:08", "throughput": 4088.17, "total_tokens": 67442072} +{"current_steps": 116345, "total_steps": 119360, "loss": 0.3596, "lr": 1.9436506876523986e-08, "epoch": 19.49480563002681, "percentage": 97.47, "elapsed_time": "4:34:57", "remaining_time": "0:07:07", "throughput": 4088.17, "total_tokens": 67444920} +{"current_steps": 116350, "total_steps": 119360, "loss": 0.2627, "lr": 1.937215725626329e-08, "epoch": 19.49564343163539, "percentage": 97.48, "elapsed_time": "4:34:58", "remaining_time": "0:07:06", "throughput": 4088.18, "total_tokens": 67447544} +{"current_steps": 116355, "total_steps": 119360, "loss": 0.6895, "lr": 1.9307914129038097e-08, "epoch": 19.49648123324397, "percentage": 97.48, "elapsed_time": "4:34:58", "remaining_time": "0:07:06", "throughput": 4088.19, "total_tokens": 67450680} +{"current_steps": 116360, "total_steps": 119360, "loss": 0.3531, "lr": 1.9243777496222303e-08, "epoch": 19.49731903485255, "percentage": 97.49, "elapsed_time": "4:34:59", "remaining_time": "0:07:05", "throughput": 4088.2, "total_tokens": 67453592} +{"current_steps": 116365, "total_steps": 119360, "loss": 0.4712, "lr": 1.9179747359186484e-08, "epoch": 19.498156836461128, "percentage": 97.49, "elapsed_time": "4:35:00", "remaining_time": "0:07:04", "throughput": 4088.21, "total_tokens": 67456312} +{"current_steps": 116370, "total_steps": 119360, "loss": 0.585, "lr": 1.9115823719300098e-08, "epoch": 19.498994638069703, "percentage": 97.49, "elapsed_time": "4:35:00", "remaining_time": "0:07:03", "throughput": 4088.22, "total_tokens": 67459160} +{"current_steps": 116375, "total_steps": 119360, "loss": 0.798, "lr": 1.905200657793038e-08, "epoch": 19.499832439678283, "percentage": 97.5, "elapsed_time": "4:35:01", "remaining_time": "0:07:03", "throughput": 4088.23, "total_tokens": 67462008} +{"current_steps": 116380, "total_steps": 119360, "loss": 0.3378, "lr": 1.8988295936440692e-08, "epoch": 19.500670241286862, "percentage": 97.5, "elapsed_time": "4:35:02", "remaining_time": "0:07:02", "throughput": 4088.23, "total_tokens": 67464792} +{"current_steps": 116385, "total_steps": 119360, "loss": 0.4558, "lr": 1.8924691796194384e-08, "epoch": 19.50150804289544, "percentage": 97.51, "elapsed_time": "4:35:02", "remaining_time": "0:07:01", "throughput": 4088.24, "total_tokens": 67467608} +{"current_steps": 116390, "total_steps": 119360, "loss": 0.5232, "lr": 1.886119415855092e-08, "epoch": 19.50234584450402, "percentage": 97.51, "elapsed_time": "4:35:03", "remaining_time": "0:07:01", "throughput": 4088.25, "total_tokens": 67470392} +{"current_steps": 116395, "total_steps": 119360, "loss": 0.6028, "lr": 1.879780302486811e-08, "epoch": 19.5031836461126, "percentage": 97.52, "elapsed_time": "4:35:04", "remaining_time": "0:07:00", "throughput": 4088.26, "total_tokens": 67473336} +{"current_steps": 116400, "total_steps": 119360, "loss": 0.4337, "lr": 1.8734518396500977e-08, "epoch": 19.50402144772118, "percentage": 97.52, "elapsed_time": "4:35:04", "remaining_time": "0:06:59", "throughput": 4088.26, "total_tokens": 67476024} +{"current_steps": 116405, "total_steps": 119360, "loss": 0.3427, "lr": 1.867134027480344e-08, "epoch": 19.50485924932976, "percentage": 97.52, "elapsed_time": "4:35:05", "remaining_time": "0:06:58", "throughput": 4088.27, "total_tokens": 67478712} +{"current_steps": 116410, "total_steps": 119360, "loss": 0.417, "lr": 1.8608268661125527e-08, "epoch": 19.505697050938338, "percentage": 97.53, "elapsed_time": "4:35:06", "remaining_time": "0:06:58", "throughput": 4088.27, "total_tokens": 67481208} +{"current_steps": 116415, "total_steps": 119360, "loss": 0.5112, "lr": 1.854530355681561e-08, "epoch": 19.506534852546917, "percentage": 97.53, "elapsed_time": "4:35:06", "remaining_time": "0:06:57", "throughput": 4088.27, "total_tokens": 67484024} +{"current_steps": 116420, "total_steps": 119360, "loss": 0.2966, "lr": 1.848244496322149e-08, "epoch": 19.507372654155496, "percentage": 97.54, "elapsed_time": "4:35:07", "remaining_time": "0:06:56", "throughput": 4088.28, "total_tokens": 67486840} +{"current_steps": 116425, "total_steps": 119360, "loss": 0.506, "lr": 1.8419692881685436e-08, "epoch": 19.508210455764075, "percentage": 97.54, "elapsed_time": "4:35:08", "remaining_time": "0:06:56", "throughput": 4088.29, "total_tokens": 67489720} +{"current_steps": 116430, "total_steps": 119360, "loss": 0.2689, "lr": 1.8357047313550258e-08, "epoch": 19.509048257372655, "percentage": 97.55, "elapsed_time": "4:35:08", "remaining_time": "0:06:55", "throughput": 4088.29, "total_tokens": 67492408} +{"current_steps": 116435, "total_steps": 119360, "loss": 0.3712, "lr": 1.8294508260154885e-08, "epoch": 19.509886058981234, "percentage": 97.55, "elapsed_time": "4:35:09", "remaining_time": "0:06:54", "throughput": 4088.29, "total_tokens": 67495224} +{"current_steps": 116440, "total_steps": 119360, "loss": 0.3136, "lr": 1.8232075722836584e-08, "epoch": 19.510723860589813, "percentage": 97.55, "elapsed_time": "4:35:10", "remaining_time": "0:06:54", "throughput": 4088.31, "total_tokens": 67498168} +{"current_steps": 116445, "total_steps": 119360, "loss": 0.4869, "lr": 1.8169749702930394e-08, "epoch": 19.511561662198392, "percentage": 97.56, "elapsed_time": "4:35:10", "remaining_time": "0:06:53", "throughput": 4088.31, "total_tokens": 67500920} +{"current_steps": 116450, "total_steps": 119360, "loss": 0.3621, "lr": 1.8107530201768586e-08, "epoch": 19.51239946380697, "percentage": 97.56, "elapsed_time": "4:35:11", "remaining_time": "0:06:52", "throughput": 4088.32, "total_tokens": 67503960} +{"current_steps": 116455, "total_steps": 119360, "loss": 0.4445, "lr": 1.804541722068176e-08, "epoch": 19.51323726541555, "percentage": 97.57, "elapsed_time": "4:35:12", "remaining_time": "0:06:51", "throughput": 4088.33, "total_tokens": 67506552} +{"current_steps": 116460, "total_steps": 119360, "loss": 0.324, "lr": 1.79834107609983e-08, "epoch": 19.51407506702413, "percentage": 97.57, "elapsed_time": "4:35:12", "remaining_time": "0:06:51", "throughput": 4088.34, "total_tokens": 67509592} +{"current_steps": 116465, "total_steps": 119360, "loss": 0.5144, "lr": 1.7921510824043807e-08, "epoch": 19.514912868632706, "percentage": 97.57, "elapsed_time": "4:35:13", "remaining_time": "0:06:50", "throughput": 4088.35, "total_tokens": 67512600} +{"current_steps": 116470, "total_steps": 119360, "loss": 0.2451, "lr": 1.7859717411141675e-08, "epoch": 19.515750670241285, "percentage": 97.58, "elapsed_time": "4:35:14", "remaining_time": "0:06:49", "throughput": 4088.36, "total_tokens": 67515480} +{"current_steps": 116475, "total_steps": 119360, "loss": 0.1855, "lr": 1.7798030523613065e-08, "epoch": 19.516588471849865, "percentage": 97.58, "elapsed_time": "4:35:14", "remaining_time": "0:06:49", "throughput": 4088.37, "total_tokens": 67518392} +{"current_steps": 116480, "total_steps": 119360, "loss": 0.569, "lr": 1.773645016277692e-08, "epoch": 19.517426273458444, "percentage": 97.59, "elapsed_time": "4:35:15", "remaining_time": "0:06:48", "throughput": 4088.37, "total_tokens": 67521208} +{"current_steps": 116485, "total_steps": 119360, "loss": 0.3674, "lr": 1.7674976329949965e-08, "epoch": 19.518264075067023, "percentage": 97.59, "elapsed_time": "4:35:16", "remaining_time": "0:06:47", "throughput": 4088.38, "total_tokens": 67524184} +{"current_steps": 116490, "total_steps": 119360, "loss": 0.1142, "lr": 1.761360902644671e-08, "epoch": 19.519101876675602, "percentage": 97.6, "elapsed_time": "4:35:16", "remaining_time": "0:06:46", "throughput": 4088.39, "total_tokens": 67527064} +{"current_steps": 116495, "total_steps": 119360, "loss": 0.3115, "lr": 1.7552348253578876e-08, "epoch": 19.51993967828418, "percentage": 97.6, "elapsed_time": "4:35:17", "remaining_time": "0:06:46", "throughput": 4088.4, "total_tokens": 67530008} +{"current_steps": 116500, "total_steps": 119360, "loss": 0.5084, "lr": 1.7491194012657087e-08, "epoch": 19.52077747989276, "percentage": 97.6, "elapsed_time": "4:35:18", "remaining_time": "0:06:45", "throughput": 4088.41, "total_tokens": 67533048} +{"current_steps": 116505, "total_steps": 119360, "loss": 0.3724, "lr": 1.743014630498807e-08, "epoch": 19.52161528150134, "percentage": 97.61, "elapsed_time": "4:35:18", "remaining_time": "0:06:44", "throughput": 4088.42, "total_tokens": 67535960} +{"current_steps": 116510, "total_steps": 119360, "loss": 0.3116, "lr": 1.7369205131878008e-08, "epoch": 19.52245308310992, "percentage": 97.61, "elapsed_time": "4:35:19", "remaining_time": "0:06:44", "throughput": 4088.42, "total_tokens": 67538744} +{"current_steps": 116515, "total_steps": 119360, "loss": 0.1739, "lr": 1.7308370494628636e-08, "epoch": 19.5232908847185, "percentage": 97.62, "elapsed_time": "4:35:20", "remaining_time": "0:06:43", "throughput": 4088.43, "total_tokens": 67541624} +{"current_steps": 116520, "total_steps": 119360, "loss": 0.5717, "lr": 1.724764239454224e-08, "epoch": 19.524128686327078, "percentage": 97.62, "elapsed_time": "4:35:20", "remaining_time": "0:06:42", "throughput": 4088.44, "total_tokens": 67544376} +{"current_steps": 116525, "total_steps": 119360, "loss": 0.3838, "lr": 1.7187020832916124e-08, "epoch": 19.524966487935657, "percentage": 97.62, "elapsed_time": "4:35:21", "remaining_time": "0:06:41", "throughput": 4088.44, "total_tokens": 67547064} +{"current_steps": 116530, "total_steps": 119360, "loss": 0.1999, "lr": 1.7126505811047023e-08, "epoch": 19.525804289544237, "percentage": 97.63, "elapsed_time": "4:35:22", "remaining_time": "0:06:41", "throughput": 4088.45, "total_tokens": 67550040} +{"current_steps": 116535, "total_steps": 119360, "loss": 0.2812, "lr": 1.7066097330228348e-08, "epoch": 19.526642091152816, "percentage": 97.63, "elapsed_time": "4:35:22", "remaining_time": "0:06:40", "throughput": 4088.45, "total_tokens": 67552632} +{"current_steps": 116540, "total_steps": 119360, "loss": 0.389, "lr": 1.7005795391752398e-08, "epoch": 19.527479892761395, "percentage": 97.64, "elapsed_time": "4:35:23", "remaining_time": "0:06:39", "throughput": 4088.46, "total_tokens": 67555672} +{"current_steps": 116545, "total_steps": 119360, "loss": 0.4005, "lr": 1.6945599996908148e-08, "epoch": 19.528317694369974, "percentage": 97.64, "elapsed_time": "4:35:24", "remaining_time": "0:06:39", "throughput": 4088.47, "total_tokens": 67558520} +{"current_steps": 116550, "total_steps": 119360, "loss": 0.2819, "lr": 1.6885511146982338e-08, "epoch": 19.529155495978554, "percentage": 97.65, "elapsed_time": "4:35:24", "remaining_time": "0:06:38", "throughput": 4088.48, "total_tokens": 67561720} +{"current_steps": 116555, "total_steps": 119360, "loss": 0.6196, "lr": 1.6825528843260054e-08, "epoch": 19.529993297587133, "percentage": 97.65, "elapsed_time": "4:35:25", "remaining_time": "0:06:37", "throughput": 4088.48, "total_tokens": 67564472} +{"current_steps": 116560, "total_steps": 119360, "loss": 0.2995, "lr": 1.6765653087023604e-08, "epoch": 19.530831099195712, "percentage": 97.65, "elapsed_time": "4:35:26", "remaining_time": "0:06:36", "throughput": 4088.49, "total_tokens": 67567320} +{"current_steps": 116565, "total_steps": 119360, "loss": 0.2285, "lr": 1.6705883879554185e-08, "epoch": 19.531668900804288, "percentage": 97.66, "elapsed_time": "4:35:26", "remaining_time": "0:06:36", "throughput": 4088.49, "total_tokens": 67570040} +{"current_steps": 116570, "total_steps": 119360, "loss": 0.3705, "lr": 1.6646221222128557e-08, "epoch": 19.532506702412867, "percentage": 97.66, "elapsed_time": "4:35:27", "remaining_time": "0:06:35", "throughput": 4088.5, "total_tokens": 67573048} +{"current_steps": 116575, "total_steps": 119360, "loss": 0.3303, "lr": 1.6586665116022362e-08, "epoch": 19.533344504021446, "percentage": 97.67, "elapsed_time": "4:35:28", "remaining_time": "0:06:34", "throughput": 4088.51, "total_tokens": 67575800} +{"current_steps": 116580, "total_steps": 119360, "loss": 0.2846, "lr": 1.6527215562510135e-08, "epoch": 19.534182305630026, "percentage": 97.67, "elapsed_time": "4:35:28", "remaining_time": "0:06:34", "throughput": 4088.52, "total_tokens": 67578616} +{"current_steps": 116585, "total_steps": 119360, "loss": 0.2434, "lr": 1.646787256286253e-08, "epoch": 19.535020107238605, "percentage": 97.68, "elapsed_time": "4:35:29", "remaining_time": "0:06:33", "throughput": 4088.53, "total_tokens": 67581656} +{"current_steps": 116590, "total_steps": 119360, "loss": 0.4778, "lr": 1.640863611834742e-08, "epoch": 19.535857908847184, "percentage": 97.68, "elapsed_time": "4:35:30", "remaining_time": "0:06:32", "throughput": 4088.54, "total_tokens": 67584728} +{"current_steps": 116595, "total_steps": 119360, "loss": 0.2597, "lr": 1.6349506230232683e-08, "epoch": 19.536695710455763, "percentage": 97.68, "elapsed_time": "4:35:30", "remaining_time": "0:06:32", "throughput": 4088.56, "total_tokens": 67587672} +{"current_steps": 116600, "total_steps": 119360, "loss": 0.2906, "lr": 1.6290482899781746e-08, "epoch": 19.537533512064343, "percentage": 97.69, "elapsed_time": "4:35:31", "remaining_time": "0:06:31", "throughput": 4088.56, "total_tokens": 67590392} +{"current_steps": 116605, "total_steps": 119360, "loss": 0.3408, "lr": 1.6231566128256938e-08, "epoch": 19.538371313672922, "percentage": 97.69, "elapsed_time": "4:35:32", "remaining_time": "0:06:30", "throughput": 4088.57, "total_tokens": 67593336} +{"current_steps": 116610, "total_steps": 119360, "loss": 0.3053, "lr": 1.6172755916917804e-08, "epoch": 19.5392091152815, "percentage": 97.7, "elapsed_time": "4:35:32", "remaining_time": "0:06:29", "throughput": 4088.58, "total_tokens": 67596280} +{"current_steps": 116615, "total_steps": 119360, "loss": 0.2307, "lr": 1.6114052267022228e-08, "epoch": 19.54004691689008, "percentage": 97.7, "elapsed_time": "4:35:33", "remaining_time": "0:06:29", "throughput": 4088.59, "total_tokens": 67599160} +{"current_steps": 116620, "total_steps": 119360, "loss": 0.26, "lr": 1.605545517982532e-08, "epoch": 19.54088471849866, "percentage": 97.7, "elapsed_time": "4:35:34", "remaining_time": "0:06:28", "throughput": 4088.59, "total_tokens": 67601848} +{"current_steps": 116625, "total_steps": 119360, "loss": 0.1475, "lr": 1.5996964656579405e-08, "epoch": 19.54172252010724, "percentage": 97.71, "elapsed_time": "4:35:34", "remaining_time": "0:06:27", "throughput": 4088.6, "total_tokens": 67604600} +{"current_steps": 116630, "total_steps": 119360, "loss": 0.1747, "lr": 1.5938580698535154e-08, "epoch": 19.54256032171582, "percentage": 97.71, "elapsed_time": "4:35:35", "remaining_time": "0:06:27", "throughput": 4088.61, "total_tokens": 67607512} +{"current_steps": 116635, "total_steps": 119360, "loss": 0.3798, "lr": 1.588030330694157e-08, "epoch": 19.543398123324398, "percentage": 97.72, "elapsed_time": "4:35:36", "remaining_time": "0:06:26", "throughput": 4088.63, "total_tokens": 67610552} +{"current_steps": 116640, "total_steps": 119360, "loss": 0.3837, "lr": 1.5822132483044318e-08, "epoch": 19.544235924932977, "percentage": 97.72, "elapsed_time": "4:35:36", "remaining_time": "0:06:25", "throughput": 4088.64, "total_tokens": 67613464} +{"current_steps": 116645, "total_steps": 119360, "loss": 0.3467, "lr": 1.5764068228087404e-08, "epoch": 19.545073726541556, "percentage": 97.73, "elapsed_time": "4:35:37", "remaining_time": "0:06:24", "throughput": 4088.65, "total_tokens": 67616568} +{"current_steps": 116650, "total_steps": 119360, "loss": 0.1433, "lr": 1.5706110543311503e-08, "epoch": 19.545911528150135, "percentage": 97.73, "elapsed_time": "4:35:38", "remaining_time": "0:06:24", "throughput": 4088.66, "total_tokens": 67619352} +{"current_steps": 116655, "total_steps": 119360, "loss": 0.3236, "lr": 1.5648259429956735e-08, "epoch": 19.546749329758715, "percentage": 97.73, "elapsed_time": "4:35:38", "remaining_time": "0:06:23", "throughput": 4088.67, "total_tokens": 67622232} +{"current_steps": 116660, "total_steps": 119360, "loss": 0.3879, "lr": 1.559051488925989e-08, "epoch": 19.547587131367294, "percentage": 97.74, "elapsed_time": "4:35:39", "remaining_time": "0:06:22", "throughput": 4088.67, "total_tokens": 67624920} +{"current_steps": 116665, "total_steps": 119360, "loss": 0.3576, "lr": 1.553287692245553e-08, "epoch": 19.54842493297587, "percentage": 97.74, "elapsed_time": "4:35:40", "remaining_time": "0:06:22", "throughput": 4088.68, "total_tokens": 67627768} +{"current_steps": 116670, "total_steps": 119360, "loss": 0.4185, "lr": 1.5475345530775454e-08, "epoch": 19.54926273458445, "percentage": 97.75, "elapsed_time": "4:35:40", "remaining_time": "0:06:21", "throughput": 4088.69, "total_tokens": 67630680} +{"current_steps": 116675, "total_steps": 119360, "loss": 0.2729, "lr": 1.5417920715450896e-08, "epoch": 19.55010053619303, "percentage": 97.75, "elapsed_time": "4:35:41", "remaining_time": "0:06:20", "throughput": 4088.7, "total_tokens": 67633560} +{"current_steps": 116680, "total_steps": 119360, "loss": 0.4832, "lr": 1.5360602477708652e-08, "epoch": 19.550938337801608, "percentage": 97.75, "elapsed_time": "4:35:42", "remaining_time": "0:06:19", "throughput": 4088.71, "total_tokens": 67636536} +{"current_steps": 116685, "total_steps": 119360, "loss": 0.3291, "lr": 1.5303390818774965e-08, "epoch": 19.551776139410187, "percentage": 97.76, "elapsed_time": "4:35:42", "remaining_time": "0:06:19", "throughput": 4088.72, "total_tokens": 67639288} +{"current_steps": 116690, "total_steps": 119360, "loss": 0.0729, "lr": 1.5246285739872746e-08, "epoch": 19.552613941018766, "percentage": 97.76, "elapsed_time": "4:35:43", "remaining_time": "0:06:18", "throughput": 4088.72, "total_tokens": 67641880} +{"current_steps": 116695, "total_steps": 119360, "loss": 0.2045, "lr": 1.518928724222324e-08, "epoch": 19.553451742627345, "percentage": 97.77, "elapsed_time": "4:35:44", "remaining_time": "0:06:17", "throughput": 4088.72, "total_tokens": 67644536} +{"current_steps": 116700, "total_steps": 119360, "loss": 0.2871, "lr": 1.5132395327044913e-08, "epoch": 19.554289544235925, "percentage": 97.77, "elapsed_time": "4:35:44", "remaining_time": "0:06:17", "throughput": 4088.72, "total_tokens": 67647064} +{"current_steps": 116705, "total_steps": 119360, "loss": 0.5646, "lr": 1.507560999555402e-08, "epoch": 19.555127345844504, "percentage": 97.78, "elapsed_time": "4:35:45", "remaining_time": "0:06:16", "throughput": 4088.73, "total_tokens": 67650008} +{"current_steps": 116710, "total_steps": 119360, "loss": 0.1271, "lr": 1.501893124896514e-08, "epoch": 19.555965147453083, "percentage": 97.78, "elapsed_time": "4:35:46", "remaining_time": "0:06:15", "throughput": 4088.74, "total_tokens": 67652888} +{"current_steps": 116715, "total_steps": 119360, "loss": 0.2841, "lr": 1.4962359088490085e-08, "epoch": 19.556802949061662, "percentage": 97.78, "elapsed_time": "4:35:46", "remaining_time": "0:06:14", "throughput": 4088.76, "total_tokens": 67655864} +{"current_steps": 116720, "total_steps": 119360, "loss": 0.3521, "lr": 1.490589351533789e-08, "epoch": 19.55764075067024, "percentage": 97.79, "elapsed_time": "4:35:47", "remaining_time": "0:06:14", "throughput": 4088.76, "total_tokens": 67658712} +{"current_steps": 116725, "total_steps": 119360, "loss": 0.2953, "lr": 1.4849534530717024e-08, "epoch": 19.55847855227882, "percentage": 97.79, "elapsed_time": "4:35:48", "remaining_time": "0:06:13", "throughput": 4088.77, "total_tokens": 67661464} +{"current_steps": 116730, "total_steps": 119360, "loss": 0.58, "lr": 1.4793282135831533e-08, "epoch": 19.5593163538874, "percentage": 97.8, "elapsed_time": "4:35:48", "remaining_time": "0:06:12", "throughput": 4088.77, "total_tokens": 67664408} +{"current_steps": 116735, "total_steps": 119360, "loss": 0.2058, "lr": 1.4737136331884339e-08, "epoch": 19.56015415549598, "percentage": 97.8, "elapsed_time": "4:35:49", "remaining_time": "0:06:12", "throughput": 4088.78, "total_tokens": 67667096} +{"current_steps": 116740, "total_steps": 119360, "loss": 0.2961, "lr": 1.4681097120076149e-08, "epoch": 19.56099195710456, "percentage": 97.8, "elapsed_time": "4:35:50", "remaining_time": "0:06:11", "throughput": 4088.79, "total_tokens": 67670008} +{"current_steps": 116745, "total_steps": 119360, "loss": 0.1545, "lr": 1.4625164501604894e-08, "epoch": 19.561829758713138, "percentage": 97.81, "elapsed_time": "4:35:50", "remaining_time": "0:06:10", "throughput": 4088.8, "total_tokens": 67673080} +{"current_steps": 116750, "total_steps": 119360, "loss": 0.2143, "lr": 1.4569338477666838e-08, "epoch": 19.562667560321717, "percentage": 97.81, "elapsed_time": "4:35:51", "remaining_time": "0:06:10", "throughput": 4088.81, "total_tokens": 67675960} +{"current_steps": 116755, "total_steps": 119360, "loss": 0.3235, "lr": 1.4513619049455474e-08, "epoch": 19.563505361930297, "percentage": 97.82, "elapsed_time": "4:35:52", "remaining_time": "0:06:09", "throughput": 4088.82, "total_tokens": 67678808} +{"current_steps": 116760, "total_steps": 119360, "loss": 0.2922, "lr": 1.4458006218162069e-08, "epoch": 19.564343163538872, "percentage": 97.82, "elapsed_time": "4:35:52", "remaining_time": "0:06:08", "throughput": 4088.82, "total_tokens": 67681560} +{"current_steps": 116765, "total_steps": 119360, "loss": 0.1435, "lr": 1.4402499984975671e-08, "epoch": 19.56518096514745, "percentage": 97.83, "elapsed_time": "4:35:53", "remaining_time": "0:06:07", "throughput": 4088.83, "total_tokens": 67684472} +{"current_steps": 116770, "total_steps": 119360, "loss": 0.4982, "lr": 1.434710035108311e-08, "epoch": 19.56601876675603, "percentage": 97.83, "elapsed_time": "4:35:54", "remaining_time": "0:06:07", "throughput": 4088.84, "total_tokens": 67687128} +{"current_steps": 116775, "total_steps": 119360, "loss": 0.2979, "lr": 1.4291807317669549e-08, "epoch": 19.56685656836461, "percentage": 97.83, "elapsed_time": "4:35:54", "remaining_time": "0:06:06", "throughput": 4088.85, "total_tokens": 67690040} +{"current_steps": 116780, "total_steps": 119360, "loss": 0.3165, "lr": 1.4236620885916264e-08, "epoch": 19.56769436997319, "percentage": 97.84, "elapsed_time": "4:35:55", "remaining_time": "0:06:05", "throughput": 4088.85, "total_tokens": 67692920} +{"current_steps": 116785, "total_steps": 119360, "loss": 0.3103, "lr": 1.4181541057003423e-08, "epoch": 19.56853217158177, "percentage": 97.84, "elapsed_time": "4:35:56", "remaining_time": "0:06:05", "throughput": 4088.87, "total_tokens": 67696056} +{"current_steps": 116790, "total_steps": 119360, "loss": 0.289, "lr": 1.4126567832108973e-08, "epoch": 19.569369973190348, "percentage": 97.85, "elapsed_time": "4:35:56", "remaining_time": "0:06:04", "throughput": 4088.87, "total_tokens": 67698840} +{"current_steps": 116795, "total_steps": 119360, "loss": 0.4553, "lr": 1.407170121240864e-08, "epoch": 19.570207774798927, "percentage": 97.85, "elapsed_time": "4:35:57", "remaining_time": "0:06:03", "throughput": 4088.87, "total_tokens": 67701528} +{"current_steps": 116800, "total_steps": 119360, "loss": 0.3111, "lr": 1.4016941199074819e-08, "epoch": 19.571045576407506, "percentage": 97.86, "elapsed_time": "4:35:58", "remaining_time": "0:06:02", "throughput": 4088.88, "total_tokens": 67704280} +{"current_steps": 116805, "total_steps": 119360, "loss": 0.3922, "lr": 1.3962287793278796e-08, "epoch": 19.571883378016086, "percentage": 97.86, "elapsed_time": "4:35:58", "remaining_time": "0:06:02", "throughput": 4088.88, "total_tokens": 67706808} +{"current_steps": 116810, "total_steps": 119360, "loss": 0.3339, "lr": 1.390774099618908e-08, "epoch": 19.572721179624665, "percentage": 97.86, "elapsed_time": "4:35:59", "remaining_time": "0:06:01", "throughput": 4088.88, "total_tokens": 67709464} +{"current_steps": 116815, "total_steps": 119360, "loss": 0.3566, "lr": 1.3853300808971958e-08, "epoch": 19.573558981233244, "percentage": 97.87, "elapsed_time": "4:36:00", "remaining_time": "0:06:00", "throughput": 4088.88, "total_tokens": 67711992} +{"current_steps": 116820, "total_steps": 119360, "loss": 0.2897, "lr": 1.3798967232791505e-08, "epoch": 19.574396782841823, "percentage": 97.87, "elapsed_time": "4:36:00", "remaining_time": "0:06:00", "throughput": 4088.89, "total_tokens": 67714968} +{"current_steps": 116825, "total_steps": 119360, "loss": 0.3882, "lr": 1.3744740268809565e-08, "epoch": 19.575234584450403, "percentage": 97.88, "elapsed_time": "4:36:01", "remaining_time": "0:05:59", "throughput": 4088.9, "total_tokens": 67717912} +{"current_steps": 116830, "total_steps": 119360, "loss": 0.3134, "lr": 1.3690619918184655e-08, "epoch": 19.576072386058982, "percentage": 97.88, "elapsed_time": "4:36:02", "remaining_time": "0:05:58", "throughput": 4088.92, "total_tokens": 67721080} +{"current_steps": 116835, "total_steps": 119360, "loss": 0.2435, "lr": 1.3636606182075296e-08, "epoch": 19.57691018766756, "percentage": 97.88, "elapsed_time": "4:36:02", "remaining_time": "0:05:57", "throughput": 4088.93, "total_tokens": 67724024} +{"current_steps": 116840, "total_steps": 119360, "loss": 0.2185, "lr": 1.3582699061635563e-08, "epoch": 19.57774798927614, "percentage": 97.89, "elapsed_time": "4:36:03", "remaining_time": "0:05:57", "throughput": 4088.94, "total_tokens": 67727160} +{"current_steps": 116845, "total_steps": 119360, "loss": 0.2105, "lr": 1.3528898558018422e-08, "epoch": 19.57858579088472, "percentage": 97.89, "elapsed_time": "4:36:04", "remaining_time": "0:05:56", "throughput": 4088.95, "total_tokens": 67730104} +{"current_steps": 116850, "total_steps": 119360, "loss": 0.2138, "lr": 1.3475204672374064e-08, "epoch": 19.5794235924933, "percentage": 97.9, "elapsed_time": "4:36:04", "remaining_time": "0:05:55", "throughput": 4088.96, "total_tokens": 67732856} +{"current_steps": 116855, "total_steps": 119360, "loss": 0.3672, "lr": 1.3421617405850463e-08, "epoch": 19.58026139410188, "percentage": 97.9, "elapsed_time": "4:36:05", "remaining_time": "0:05:55", "throughput": 4088.97, "total_tokens": 67735832} +{"current_steps": 116860, "total_steps": 119360, "loss": 0.3393, "lr": 1.3368136759593364e-08, "epoch": 19.581099195710454, "percentage": 97.91, "elapsed_time": "4:36:06", "remaining_time": "0:05:54", "throughput": 4088.98, "total_tokens": 67738936} +{"current_steps": 116865, "total_steps": 119360, "loss": 0.6636, "lr": 1.33147627347463e-08, "epoch": 19.581936997319033, "percentage": 97.91, "elapsed_time": "4:36:06", "remaining_time": "0:05:53", "throughput": 4088.98, "total_tokens": 67742168} +{"current_steps": 116870, "total_steps": 119360, "loss": 0.51, "lr": 1.326149533245058e-08, "epoch": 19.582774798927613, "percentage": 97.91, "elapsed_time": "4:36:07", "remaining_time": "0:05:52", "throughput": 4089.0, "total_tokens": 67745176} +{"current_steps": 116875, "total_steps": 119360, "loss": 0.2708, "lr": 1.3208334553845293e-08, "epoch": 19.583612600536192, "percentage": 97.92, "elapsed_time": "4:36:08", "remaining_time": "0:05:52", "throughput": 4089.01, "total_tokens": 67748216} +{"current_steps": 116880, "total_steps": 119360, "loss": 0.1786, "lr": 1.315528040006675e-08, "epoch": 19.58445040214477, "percentage": 97.92, "elapsed_time": "4:36:09", "remaining_time": "0:05:51", "throughput": 4089.02, "total_tokens": 67751096} +{"current_steps": 116885, "total_steps": 119360, "loss": 0.2312, "lr": 1.3102332872249602e-08, "epoch": 19.58528820375335, "percentage": 97.93, "elapsed_time": "4:36:09", "remaining_time": "0:05:50", "throughput": 4089.02, "total_tokens": 67753784} +{"current_steps": 116890, "total_steps": 119360, "loss": 0.2025, "lr": 1.3049491971525718e-08, "epoch": 19.58612600536193, "percentage": 97.93, "elapsed_time": "4:36:10", "remaining_time": "0:05:50", "throughput": 4089.04, "total_tokens": 67756888} +{"current_steps": 116895, "total_steps": 119360, "loss": 0.4141, "lr": 1.299675769902531e-08, "epoch": 19.58696380697051, "percentage": 97.93, "elapsed_time": "4:36:11", "remaining_time": "0:05:49", "throughput": 4089.05, "total_tokens": 67759800} +{"current_steps": 116900, "total_steps": 119360, "loss": 0.2083, "lr": 1.2944130055875248e-08, "epoch": 19.58780160857909, "percentage": 97.94, "elapsed_time": "4:36:11", "remaining_time": "0:05:48", "throughput": 4089.05, "total_tokens": 67762488} +{"current_steps": 116905, "total_steps": 119360, "loss": 0.4154, "lr": 1.2891609043201302e-08, "epoch": 19.588639410187668, "percentage": 97.94, "elapsed_time": "4:36:12", "remaining_time": "0:05:48", "throughput": 4089.06, "total_tokens": 67765240} +{"current_steps": 116910, "total_steps": 119360, "loss": 0.6102, "lr": 1.2839194662126465e-08, "epoch": 19.589477211796247, "percentage": 97.95, "elapsed_time": "4:36:12", "remaining_time": "0:05:47", "throughput": 4089.07, "total_tokens": 67768088} +{"current_steps": 116915, "total_steps": 119360, "loss": 0.2933, "lr": 1.2786886913770947e-08, "epoch": 19.590315013404826, "percentage": 97.95, "elapsed_time": "4:36:13", "remaining_time": "0:05:46", "throughput": 4089.07, "total_tokens": 67770840} +{"current_steps": 116920, "total_steps": 119360, "loss": 0.1743, "lr": 1.27346857992533e-08, "epoch": 19.591152815013405, "percentage": 97.96, "elapsed_time": "4:36:14", "remaining_time": "0:05:45", "throughput": 4089.09, "total_tokens": 67773784} +{"current_steps": 116925, "total_steps": 119360, "loss": 0.2435, "lr": 1.2682591319690406e-08, "epoch": 19.591990616621985, "percentage": 97.96, "elapsed_time": "4:36:14", "remaining_time": "0:05:45", "throughput": 4089.09, "total_tokens": 67776568} +{"current_steps": 116930, "total_steps": 119360, "loss": 0.2658, "lr": 1.2630603476195269e-08, "epoch": 19.592828418230564, "percentage": 97.96, "elapsed_time": "4:36:15", "remaining_time": "0:05:44", "throughput": 4089.1, "total_tokens": 67779448} +{"current_steps": 116935, "total_steps": 119360, "loss": 0.1981, "lr": 1.2578722269879774e-08, "epoch": 19.593666219839143, "percentage": 97.97, "elapsed_time": "4:36:16", "remaining_time": "0:05:43", "throughput": 4089.11, "total_tokens": 67782136} +{"current_steps": 116940, "total_steps": 119360, "loss": 0.2518, "lr": 1.2526947701853032e-08, "epoch": 19.594504021447722, "percentage": 97.97, "elapsed_time": "4:36:16", "remaining_time": "0:05:43", "throughput": 4089.12, "total_tokens": 67785208} +{"current_steps": 116945, "total_steps": 119360, "loss": 0.3503, "lr": 1.2475279773222493e-08, "epoch": 19.5953418230563, "percentage": 97.98, "elapsed_time": "4:36:17", "remaining_time": "0:05:42", "throughput": 4089.13, "total_tokens": 67788248} +{"current_steps": 116950, "total_steps": 119360, "loss": 0.2899, "lr": 1.2423718485092274e-08, "epoch": 19.59617962466488, "percentage": 97.98, "elapsed_time": "4:36:18", "remaining_time": "0:05:41", "throughput": 4089.14, "total_tokens": 67791256} +{"current_steps": 116955, "total_steps": 119360, "loss": 0.3367, "lr": 1.2372263838565934e-08, "epoch": 19.59701742627346, "percentage": 97.99, "elapsed_time": "4:36:19", "remaining_time": "0:05:40", "throughput": 4089.15, "total_tokens": 67794168} +{"current_steps": 116960, "total_steps": 119360, "loss": 0.2169, "lr": 1.2320915834742598e-08, "epoch": 19.597855227882036, "percentage": 97.99, "elapsed_time": "4:36:19", "remaining_time": "0:05:40", "throughput": 4089.16, "total_tokens": 67797048} +{"current_steps": 116965, "total_steps": 119360, "loss": 0.2146, "lr": 1.2269674474719717e-08, "epoch": 19.598693029490615, "percentage": 97.99, "elapsed_time": "4:36:20", "remaining_time": "0:05:39", "throughput": 4089.17, "total_tokens": 67799928} +{"current_steps": 116970, "total_steps": 119360, "loss": 0.4345, "lr": 1.2218539759594195e-08, "epoch": 19.599530831099194, "percentage": 98.0, "elapsed_time": "4:36:20", "remaining_time": "0:05:38", "throughput": 4089.18, "total_tokens": 67802584} +{"current_steps": 116975, "total_steps": 119360, "loss": 0.3605, "lr": 1.2167511690459044e-08, "epoch": 19.600368632707774, "percentage": 98.0, "elapsed_time": "4:36:21", "remaining_time": "0:05:38", "throughput": 4089.18, "total_tokens": 67805432} +{"current_steps": 116980, "total_steps": 119360, "loss": 0.3474, "lr": 1.211659026840506e-08, "epoch": 19.601206434316353, "percentage": 98.01, "elapsed_time": "4:36:22", "remaining_time": "0:05:37", "throughput": 4089.19, "total_tokens": 67808152} +{"current_steps": 116985, "total_steps": 119360, "loss": 0.4424, "lr": 1.2065775494520815e-08, "epoch": 19.602044235924932, "percentage": 98.01, "elapsed_time": "4:36:23", "remaining_time": "0:05:36", "throughput": 4089.2, "total_tokens": 67811224} +{"current_steps": 116990, "total_steps": 119360, "loss": 0.3197, "lr": 1.2015067369892664e-08, "epoch": 19.60288203753351, "percentage": 98.01, "elapsed_time": "4:36:23", "remaining_time": "0:05:35", "throughput": 4089.21, "total_tokens": 67814072} +{"current_steps": 116995, "total_steps": 119360, "loss": 0.4031, "lr": 1.1964465895605848e-08, "epoch": 19.60371983914209, "percentage": 98.02, "elapsed_time": "4:36:24", "remaining_time": "0:05:35", "throughput": 4089.22, "total_tokens": 67817016} +{"current_steps": 117000, "total_steps": 119360, "loss": 0.3508, "lr": 1.1913971072741726e-08, "epoch": 19.60455764075067, "percentage": 98.02, "elapsed_time": "4:36:25", "remaining_time": "0:05:34", "throughput": 4089.22, "total_tokens": 67819960} +{"current_steps": 117005, "total_steps": 119360, "loss": 0.6163, "lr": 1.1863582902378878e-08, "epoch": 19.60539544235925, "percentage": 98.03, "elapsed_time": "4:36:25", "remaining_time": "0:05:33", "throughput": 4089.23, "total_tokens": 67822744} +{"current_steps": 117010, "total_steps": 119360, "loss": 0.3754, "lr": 1.1813301385596443e-08, "epoch": 19.60623324396783, "percentage": 98.03, "elapsed_time": "4:36:26", "remaining_time": "0:05:33", "throughput": 4089.25, "total_tokens": 67825912} +{"current_steps": 117015, "total_steps": 119360, "loss": 0.4745, "lr": 1.1763126523469116e-08, "epoch": 19.607071045576408, "percentage": 98.04, "elapsed_time": "4:36:27", "remaining_time": "0:05:32", "throughput": 4089.26, "total_tokens": 67828888} +{"current_steps": 117020, "total_steps": 119360, "loss": 0.4088, "lr": 1.171305831706826e-08, "epoch": 19.607908847184987, "percentage": 98.04, "elapsed_time": "4:36:27", "remaining_time": "0:05:31", "throughput": 4089.26, "total_tokens": 67831640} +{"current_steps": 117025, "total_steps": 119360, "loss": 0.404, "lr": 1.1663096767466354e-08, "epoch": 19.608746648793566, "percentage": 98.04, "elapsed_time": "4:36:28", "remaining_time": "0:05:30", "throughput": 4089.27, "total_tokens": 67834648} +{"current_steps": 117030, "total_steps": 119360, "loss": 0.4147, "lr": 1.161324187573032e-08, "epoch": 19.609584450402146, "percentage": 98.05, "elapsed_time": "4:36:29", "remaining_time": "0:05:30", "throughput": 4089.28, "total_tokens": 67837560} +{"current_steps": 117035, "total_steps": 119360, "loss": 0.3403, "lr": 1.1563493642926527e-08, "epoch": 19.610422252010725, "percentage": 98.05, "elapsed_time": "4:36:29", "remaining_time": "0:05:29", "throughput": 4089.29, "total_tokens": 67840536} +{"current_steps": 117040, "total_steps": 119360, "loss": 0.1545, "lr": 1.1513852070119125e-08, "epoch": 19.611260053619304, "percentage": 98.06, "elapsed_time": "4:36:30", "remaining_time": "0:05:28", "throughput": 4089.31, "total_tokens": 67843544} +{"current_steps": 117045, "total_steps": 119360, "loss": 0.4401, "lr": 1.1464317158368932e-08, "epoch": 19.612097855227884, "percentage": 98.06, "elapsed_time": "4:36:31", "remaining_time": "0:05:28", "throughput": 4089.32, "total_tokens": 67846520} +{"current_steps": 117050, "total_steps": 119360, "loss": 0.4406, "lr": 1.14148889087351e-08, "epoch": 19.612935656836463, "percentage": 98.06, "elapsed_time": "4:36:31", "remaining_time": "0:05:27", "throughput": 4089.33, "total_tokens": 67849496} +{"current_steps": 117055, "total_steps": 119360, "loss": 0.3113, "lr": 1.1365567322274563e-08, "epoch": 19.61377345844504, "percentage": 98.07, "elapsed_time": "4:36:32", "remaining_time": "0:05:26", "throughput": 4089.34, "total_tokens": 67852504} +{"current_steps": 117060, "total_steps": 119360, "loss": 0.2663, "lr": 1.1316352400042585e-08, "epoch": 19.614611260053618, "percentage": 98.07, "elapsed_time": "4:36:33", "remaining_time": "0:05:26", "throughput": 4089.36, "total_tokens": 67855544} +{"current_steps": 117065, "total_steps": 119360, "loss": 0.5052, "lr": 1.1267244143089995e-08, "epoch": 19.615449061662197, "percentage": 98.08, "elapsed_time": "4:36:33", "remaining_time": "0:05:25", "throughput": 4089.36, "total_tokens": 67858680} +{"current_steps": 117070, "total_steps": 119360, "loss": 0.3446, "lr": 1.1218242552467617e-08, "epoch": 19.616286863270776, "percentage": 98.08, "elapsed_time": "4:36:34", "remaining_time": "0:05:24", "throughput": 4089.38, "total_tokens": 67861752} +{"current_steps": 117075, "total_steps": 119360, "loss": 0.4911, "lr": 1.1169347629224058e-08, "epoch": 19.617124664879356, "percentage": 98.09, "elapsed_time": "4:36:35", "remaining_time": "0:05:23", "throughput": 4089.39, "total_tokens": 67864728} +{"current_steps": 117080, "total_steps": 119360, "loss": 0.2153, "lr": 1.1120559374403484e-08, "epoch": 19.617962466487935, "percentage": 98.09, "elapsed_time": "4:36:36", "remaining_time": "0:05:23", "throughput": 4089.4, "total_tokens": 67867768} +{"current_steps": 117085, "total_steps": 119360, "loss": 0.3733, "lr": 1.1071877789048947e-08, "epoch": 19.618800268096514, "percentage": 98.09, "elapsed_time": "4:36:36", "remaining_time": "0:05:22", "throughput": 4089.41, "total_tokens": 67870680} +{"current_steps": 117090, "total_steps": 119360, "loss": 0.505, "lr": 1.102330287420239e-08, "epoch": 19.619638069705093, "percentage": 98.1, "elapsed_time": "4:36:37", "remaining_time": "0:05:21", "throughput": 4089.42, "total_tokens": 67873624} +{"current_steps": 117095, "total_steps": 119360, "loss": 0.4254, "lr": 1.0974834630901875e-08, "epoch": 19.620475871313673, "percentage": 98.1, "elapsed_time": "4:36:38", "remaining_time": "0:05:21", "throughput": 4089.42, "total_tokens": 67876504} +{"current_steps": 117100, "total_steps": 119360, "loss": 0.2528, "lr": 1.0926473060183241e-08, "epoch": 19.621313672922252, "percentage": 98.11, "elapsed_time": "4:36:38", "remaining_time": "0:05:20", "throughput": 4089.44, "total_tokens": 67879576} +{"current_steps": 117105, "total_steps": 119360, "loss": 0.3066, "lr": 1.0878218163081766e-08, "epoch": 19.62215147453083, "percentage": 98.11, "elapsed_time": "4:36:39", "remaining_time": "0:05:19", "throughput": 4089.45, "total_tokens": 67882520} +{"current_steps": 117110, "total_steps": 119360, "loss": 0.4374, "lr": 1.0830069940627741e-08, "epoch": 19.62298927613941, "percentage": 98.11, "elapsed_time": "4:36:40", "remaining_time": "0:05:18", "throughput": 4089.46, "total_tokens": 67885336} +{"current_steps": 117115, "total_steps": 119360, "loss": 0.548, "lr": 1.0782028393851452e-08, "epoch": 19.62382707774799, "percentage": 98.12, "elapsed_time": "4:36:40", "remaining_time": "0:05:18", "throughput": 4089.47, "total_tokens": 67888184} +{"current_steps": 117120, "total_steps": 119360, "loss": 0.1598, "lr": 1.0734093523780409e-08, "epoch": 19.62466487935657, "percentage": 98.12, "elapsed_time": "4:36:41", "remaining_time": "0:05:17", "throughput": 4089.48, "total_tokens": 67891288} +{"current_steps": 117125, "total_steps": 119360, "loss": 0.3703, "lr": 1.0686265331438795e-08, "epoch": 19.62550268096515, "percentage": 98.13, "elapsed_time": "4:36:42", "remaining_time": "0:05:16", "throughput": 4089.48, "total_tokens": 67894200} +{"current_steps": 117130, "total_steps": 119360, "loss": 0.3814, "lr": 1.0638543817849678e-08, "epoch": 19.626340482573728, "percentage": 98.13, "elapsed_time": "4:36:42", "remaining_time": "0:05:16", "throughput": 4089.5, "total_tokens": 67897208} +{"current_steps": 117135, "total_steps": 119360, "loss": 0.4109, "lr": 1.0590928984033355e-08, "epoch": 19.627178284182307, "percentage": 98.14, "elapsed_time": "4:36:43", "remaining_time": "0:05:15", "throughput": 4089.5, "total_tokens": 67899960} +{"current_steps": 117140, "total_steps": 119360, "loss": 0.1736, "lr": 1.05434208310079e-08, "epoch": 19.628016085790886, "percentage": 98.14, "elapsed_time": "4:36:44", "remaining_time": "0:05:14", "throughput": 4089.51, "total_tokens": 67902680} +{"current_steps": 117145, "total_steps": 119360, "loss": 0.3587, "lr": 1.0496019359789167e-08, "epoch": 19.628853887399465, "percentage": 98.14, "elapsed_time": "4:36:44", "remaining_time": "0:05:13", "throughput": 4089.52, "total_tokens": 67905816} +{"current_steps": 117150, "total_steps": 119360, "loss": 0.3328, "lr": 1.0448724571390234e-08, "epoch": 19.62969168900804, "percentage": 98.15, "elapsed_time": "4:36:45", "remaining_time": "0:05:13", "throughput": 4089.53, "total_tokens": 67908760} +{"current_steps": 117155, "total_steps": 119360, "loss": 0.1582, "lr": 1.0401536466822514e-08, "epoch": 19.63052949061662, "percentage": 98.15, "elapsed_time": "4:36:46", "remaining_time": "0:05:12", "throughput": 4089.53, "total_tokens": 67911640} +{"current_steps": 117160, "total_steps": 119360, "loss": 0.3148, "lr": 1.0354455047095757e-08, "epoch": 19.6313672922252, "percentage": 98.16, "elapsed_time": "4:36:46", "remaining_time": "0:05:11", "throughput": 4089.54, "total_tokens": 67914712} +{"current_steps": 117165, "total_steps": 119360, "loss": 0.2724, "lr": 1.0307480313215268e-08, "epoch": 19.63220509383378, "percentage": 98.16, "elapsed_time": "4:36:47", "remaining_time": "0:05:11", "throughput": 4089.56, "total_tokens": 67917848} +{"current_steps": 117170, "total_steps": 119360, "loss": 0.4792, "lr": 1.0260612266186354e-08, "epoch": 19.633042895442358, "percentage": 98.17, "elapsed_time": "4:36:48", "remaining_time": "0:05:10", "throughput": 4089.57, "total_tokens": 67920824} +{"current_steps": 117175, "total_steps": 119360, "loss": 0.2543, "lr": 1.0213850907010991e-08, "epoch": 19.633880697050937, "percentage": 98.17, "elapsed_time": "4:36:48", "remaining_time": "0:05:09", "throughput": 4089.57, "total_tokens": 67923448} +{"current_steps": 117180, "total_steps": 119360, "loss": 0.3792, "lr": 1.0167196236688937e-08, "epoch": 19.634718498659517, "percentage": 98.17, "elapsed_time": "4:36:49", "remaining_time": "0:05:09", "throughput": 4089.58, "total_tokens": 67926296} +{"current_steps": 117185, "total_steps": 119360, "loss": 0.5043, "lr": 1.0120648256217724e-08, "epoch": 19.635556300268096, "percentage": 98.18, "elapsed_time": "4:36:50", "remaining_time": "0:05:08", "throughput": 4089.59, "total_tokens": 67929016} +{"current_steps": 117190, "total_steps": 119360, "loss": 0.338, "lr": 1.007420696659267e-08, "epoch": 19.636394101876675, "percentage": 98.18, "elapsed_time": "4:36:50", "remaining_time": "0:05:07", "throughput": 4089.6, "total_tokens": 67932216} +{"current_steps": 117195, "total_steps": 119360, "loss": 0.595, "lr": 1.0027872368806868e-08, "epoch": 19.637231903485254, "percentage": 98.19, "elapsed_time": "4:36:51", "remaining_time": "0:05:06", "throughput": 4089.61, "total_tokens": 67935096} +{"current_steps": 117200, "total_steps": 119360, "loss": 0.335, "lr": 9.981644463850638e-09, "epoch": 19.638069705093834, "percentage": 98.19, "elapsed_time": "4:36:52", "remaining_time": "0:05:06", "throughput": 4089.61, "total_tokens": 67937848} +{"current_steps": 117205, "total_steps": 119360, "loss": 0.325, "lr": 9.935523252712631e-09, "epoch": 19.638907506702413, "percentage": 98.19, "elapsed_time": "4:36:53", "remaining_time": "0:05:05", "throughput": 4089.62, "total_tokens": 67941048} +{"current_steps": 117210, "total_steps": 119360, "loss": 0.3735, "lr": 9.889508736378728e-09, "epoch": 19.639745308310992, "percentage": 98.2, "elapsed_time": "4:36:53", "remaining_time": "0:05:04", "throughput": 4089.63, "total_tokens": 67943896} +{"current_steps": 117215, "total_steps": 119360, "loss": 0.379, "lr": 9.84360091583314e-09, "epoch": 19.64058310991957, "percentage": 98.2, "elapsed_time": "4:36:54", "remaining_time": "0:05:04", "throughput": 4089.64, "total_tokens": 67946840} +{"current_steps": 117220, "total_steps": 119360, "loss": 0.2286, "lr": 9.797799792057306e-09, "epoch": 19.64142091152815, "percentage": 98.21, "elapsed_time": "4:36:55", "remaining_time": "0:05:03", "throughput": 4089.65, "total_tokens": 67949880} +{"current_steps": 117225, "total_steps": 119360, "loss": 0.177, "lr": 9.752105366030995e-09, "epoch": 19.64225871313673, "percentage": 98.21, "elapsed_time": "4:36:55", "remaining_time": "0:05:02", "throughput": 4089.67, "total_tokens": 67952824} +{"current_steps": 117230, "total_steps": 119360, "loss": 0.5746, "lr": 9.706517638730096e-09, "epoch": 19.64309651474531, "percentage": 98.22, "elapsed_time": "4:36:56", "remaining_time": "0:05:01", "throughput": 4089.67, "total_tokens": 67955768} +{"current_steps": 117235, "total_steps": 119360, "loss": 0.3072, "lr": 9.661036611130492e-09, "epoch": 19.64393431635389, "percentage": 98.22, "elapsed_time": "4:36:57", "remaining_time": "0:05:01", "throughput": 4089.68, "total_tokens": 67958392} +{"current_steps": 117240, "total_steps": 119360, "loss": 0.1952, "lr": 9.615662284204185e-09, "epoch": 19.644772117962468, "percentage": 98.22, "elapsed_time": "4:36:57", "remaining_time": "0:05:00", "throughput": 4089.68, "total_tokens": 67961208} +{"current_steps": 117245, "total_steps": 119360, "loss": 0.5408, "lr": 9.570394658920956e-09, "epoch": 19.645609919571047, "percentage": 98.23, "elapsed_time": "4:36:58", "remaining_time": "0:04:59", "throughput": 4089.69, "total_tokens": 67964024} +{"current_steps": 117250, "total_steps": 119360, "loss": 0.1251, "lr": 9.525233736248918e-09, "epoch": 19.646447721179626, "percentage": 98.23, "elapsed_time": "4:36:59", "remaining_time": "0:04:59", "throughput": 4089.7, "total_tokens": 67967064} +{"current_steps": 117255, "total_steps": 119360, "loss": 0.2996, "lr": 9.480179517153965e-09, "epoch": 19.647285522788202, "percentage": 98.24, "elapsed_time": "4:36:59", "remaining_time": "0:04:58", "throughput": 4089.71, "total_tokens": 67969752} +{"current_steps": 117260, "total_steps": 119360, "loss": 0.29, "lr": 9.43523200259977e-09, "epoch": 19.64812332439678, "percentage": 98.24, "elapsed_time": "4:37:00", "remaining_time": "0:04:57", "throughput": 4089.72, "total_tokens": 67972856} +{"current_steps": 117265, "total_steps": 119360, "loss": 0.3091, "lr": 9.390391193546122e-09, "epoch": 19.64896112600536, "percentage": 98.24, "elapsed_time": "4:37:01", "remaining_time": "0:04:56", "throughput": 4089.73, "total_tokens": 67975864} +{"current_steps": 117270, "total_steps": 119360, "loss": 0.3667, "lr": 9.345657090953364e-09, "epoch": 19.64979892761394, "percentage": 98.25, "elapsed_time": "4:37:01", "remaining_time": "0:04:56", "throughput": 4089.75, "total_tokens": 67979192} +{"current_steps": 117275, "total_steps": 119360, "loss": 0.5962, "lr": 9.301029695776286e-09, "epoch": 19.65063672922252, "percentage": 98.25, "elapsed_time": "4:37:02", "remaining_time": "0:04:55", "throughput": 4089.75, "total_tokens": 67981880} +{"current_steps": 117280, "total_steps": 119360, "loss": 0.462, "lr": 9.256509008970238e-09, "epoch": 19.6514745308311, "percentage": 98.26, "elapsed_time": "4:37:03", "remaining_time": "0:04:54", "throughput": 4089.77, "total_tokens": 67985176} +{"current_steps": 117285, "total_steps": 119360, "loss": 0.4454, "lr": 9.212095031487234e-09, "epoch": 19.652312332439678, "percentage": 98.26, "elapsed_time": "4:37:03", "remaining_time": "0:04:54", "throughput": 4089.78, "total_tokens": 67988120} +{"current_steps": 117290, "total_steps": 119360, "loss": 0.4866, "lr": 9.167787764275959e-09, "epoch": 19.653150134048257, "percentage": 98.27, "elapsed_time": "4:37:04", "remaining_time": "0:04:53", "throughput": 4089.79, "total_tokens": 67991128} +{"current_steps": 117295, "total_steps": 119360, "loss": 0.5595, "lr": 9.123587208284545e-09, "epoch": 19.653987935656836, "percentage": 98.27, "elapsed_time": "4:37:05", "remaining_time": "0:04:52", "throughput": 4089.8, "total_tokens": 67994136} +{"current_steps": 117300, "total_steps": 119360, "loss": 0.2655, "lr": 9.079493364457793e-09, "epoch": 19.654825737265416, "percentage": 98.27, "elapsed_time": "4:37:05", "remaining_time": "0:04:51", "throughput": 4089.81, "total_tokens": 67997080} +{"current_steps": 117305, "total_steps": 119360, "loss": 0.2518, "lr": 9.035506233738833e-09, "epoch": 19.655663538873995, "percentage": 98.28, "elapsed_time": "4:37:06", "remaining_time": "0:04:51", "throughput": 4089.82, "total_tokens": 68000088} +{"current_steps": 117310, "total_steps": 119360, "loss": 0.2594, "lr": 8.991625817067473e-09, "epoch": 19.656501340482574, "percentage": 98.28, "elapsed_time": "4:37:07", "remaining_time": "0:04:50", "throughput": 4089.83, "total_tokens": 68002872} +{"current_steps": 117315, "total_steps": 119360, "loss": 0.4217, "lr": 8.94785211538296e-09, "epoch": 19.657339142091153, "percentage": 98.29, "elapsed_time": "4:37:07", "remaining_time": "0:04:49", "throughput": 4089.83, "total_tokens": 68005496} +{"current_steps": 117320, "total_steps": 119360, "loss": 0.4718, "lr": 8.904185129620103e-09, "epoch": 19.658176943699733, "percentage": 98.29, "elapsed_time": "4:37:08", "remaining_time": "0:04:49", "throughput": 4089.84, "total_tokens": 68008440} +{"current_steps": 117325, "total_steps": 119360, "loss": 0.5115, "lr": 8.860624860713151e-09, "epoch": 19.659014745308312, "percentage": 98.3, "elapsed_time": "4:37:09", "remaining_time": "0:04:48", "throughput": 4089.85, "total_tokens": 68011832} +{"current_steps": 117330, "total_steps": 119360, "loss": 0.5031, "lr": 8.817171309593587e-09, "epoch": 19.65985254691689, "percentage": 98.3, "elapsed_time": "4:37:10", "remaining_time": "0:04:47", "throughput": 4089.86, "total_tokens": 68014552} +{"current_steps": 117335, "total_steps": 119360, "loss": 0.6425, "lr": 8.773824477190107e-09, "epoch": 19.66069034852547, "percentage": 98.3, "elapsed_time": "4:37:10", "remaining_time": "0:04:47", "throughput": 4089.86, "total_tokens": 68017144} +{"current_steps": 117340, "total_steps": 119360, "loss": 0.3472, "lr": 8.73058436442975e-09, "epoch": 19.66152815013405, "percentage": 98.31, "elapsed_time": "4:37:11", "remaining_time": "0:04:46", "throughput": 4089.86, "total_tokens": 68019768} +{"current_steps": 117345, "total_steps": 119360, "loss": 0.2049, "lr": 8.687450972237332e-09, "epoch": 19.66236595174263, "percentage": 98.31, "elapsed_time": "4:37:11", "remaining_time": "0:04:45", "throughput": 4089.87, "total_tokens": 68022584} +{"current_steps": 117350, "total_steps": 119360, "loss": 0.5212, "lr": 8.644424301534892e-09, "epoch": 19.663203753351205, "percentage": 98.32, "elapsed_time": "4:37:12", "remaining_time": "0:04:44", "throughput": 4089.89, "total_tokens": 68025560} +{"current_steps": 117355, "total_steps": 119360, "loss": 0.3186, "lr": 8.601504353241696e-09, "epoch": 19.664041554959784, "percentage": 98.32, "elapsed_time": "4:37:13", "remaining_time": "0:04:44", "throughput": 4089.89, "total_tokens": 68028632} +{"current_steps": 117360, "total_steps": 119360, "loss": 0.2619, "lr": 8.558691128277009e-09, "epoch": 19.664879356568363, "percentage": 98.32, "elapsed_time": "4:37:14", "remaining_time": "0:04:43", "throughput": 4089.9, "total_tokens": 68031608} +{"current_steps": 117365, "total_steps": 119360, "loss": 0.2529, "lr": 8.515984627554541e-09, "epoch": 19.665717158176943, "percentage": 98.33, "elapsed_time": "4:37:14", "remaining_time": "0:04:42", "throughput": 4089.91, "total_tokens": 68034648} +{"current_steps": 117370, "total_steps": 119360, "loss": 0.4078, "lr": 8.473384851988564e-09, "epoch": 19.666554959785522, "percentage": 98.33, "elapsed_time": "4:37:15", "remaining_time": "0:04:42", "throughput": 4089.92, "total_tokens": 68037464} +{"current_steps": 117375, "total_steps": 119360, "loss": 0.4913, "lr": 8.430891802490015e-09, "epoch": 19.6673927613941, "percentage": 98.34, "elapsed_time": "4:37:16", "remaining_time": "0:04:41", "throughput": 4089.93, "total_tokens": 68040184} +{"current_steps": 117380, "total_steps": 119360, "loss": 0.5211, "lr": 8.388505479966502e-09, "epoch": 19.66823056300268, "percentage": 98.34, "elapsed_time": "4:37:16", "remaining_time": "0:04:40", "throughput": 4089.93, "total_tokens": 68042840} +{"current_steps": 117385, "total_steps": 119360, "loss": 0.2562, "lr": 8.346225885324522e-09, "epoch": 19.66906836461126, "percentage": 98.35, "elapsed_time": "4:37:17", "remaining_time": "0:04:39", "throughput": 4089.94, "total_tokens": 68045816} +{"current_steps": 117390, "total_steps": 119360, "loss": 0.2154, "lr": 8.304053019468905e-09, "epoch": 19.66990616621984, "percentage": 98.35, "elapsed_time": "4:37:18", "remaining_time": "0:04:39", "throughput": 4089.95, "total_tokens": 68048760} +{"current_steps": 117395, "total_steps": 119360, "loss": 0.292, "lr": 8.261986883300599e-09, "epoch": 19.670743967828418, "percentage": 98.35, "elapsed_time": "4:37:18", "remaining_time": "0:04:38", "throughput": 4089.95, "total_tokens": 68051512} +{"current_steps": 117400, "total_steps": 119360, "loss": 0.2971, "lr": 8.22002747771944e-09, "epoch": 19.671581769436997, "percentage": 98.36, "elapsed_time": "4:37:19", "remaining_time": "0:04:37", "throughput": 4089.97, "total_tokens": 68054424} +{"current_steps": 117405, "total_steps": 119360, "loss": 0.2852, "lr": 8.178174803622485e-09, "epoch": 19.672419571045577, "percentage": 98.36, "elapsed_time": "4:37:20", "remaining_time": "0:04:37", "throughput": 4089.98, "total_tokens": 68057400} +{"current_steps": 117410, "total_steps": 119360, "loss": 0.26, "lr": 8.136428861904022e-09, "epoch": 19.673257372654156, "percentage": 98.37, "elapsed_time": "4:37:20", "remaining_time": "0:04:36", "throughput": 4089.99, "total_tokens": 68060408} +{"current_steps": 117415, "total_steps": 119360, "loss": 0.2162, "lr": 8.09478965345778e-09, "epoch": 19.674095174262735, "percentage": 98.37, "elapsed_time": "4:37:21", "remaining_time": "0:04:35", "throughput": 4090.0, "total_tokens": 68063512} +{"current_steps": 117420, "total_steps": 119360, "loss": 0.1778, "lr": 8.053257179173047e-09, "epoch": 19.674932975871315, "percentage": 98.37, "elapsed_time": "4:37:22", "remaining_time": "0:04:34", "throughput": 4090.01, "total_tokens": 68066360} +{"current_steps": 117425, "total_steps": 119360, "loss": 0.2904, "lr": 8.011831439938e-09, "epoch": 19.675770777479894, "percentage": 98.38, "elapsed_time": "4:37:22", "remaining_time": "0:04:34", "throughput": 4090.02, "total_tokens": 68069496} +{"current_steps": 117430, "total_steps": 119360, "loss": 0.184, "lr": 7.970512436639155e-09, "epoch": 19.676608579088473, "percentage": 98.38, "elapsed_time": "4:37:23", "remaining_time": "0:04:33", "throughput": 4090.03, "total_tokens": 68072440} +{"current_steps": 117435, "total_steps": 119360, "loss": 0.4186, "lr": 7.929300170159138e-09, "epoch": 19.677446380697052, "percentage": 98.39, "elapsed_time": "4:37:24", "remaining_time": "0:04:32", "throughput": 4090.04, "total_tokens": 68075512} +{"current_steps": 117440, "total_steps": 119360, "loss": 0.2577, "lr": 7.88819464137891e-09, "epoch": 19.67828418230563, "percentage": 98.39, "elapsed_time": "4:37:24", "remaining_time": "0:04:32", "throughput": 4090.05, "total_tokens": 68078232} +{"current_steps": 117445, "total_steps": 119360, "loss": 0.4105, "lr": 7.847195851178879e-09, "epoch": 19.679121983914207, "percentage": 98.4, "elapsed_time": "4:37:25", "remaining_time": "0:04:31", "throughput": 4090.05, "total_tokens": 68081048} +{"current_steps": 117450, "total_steps": 119360, "loss": 0.2242, "lr": 7.8063038004339e-09, "epoch": 19.679959785522787, "percentage": 98.4, "elapsed_time": "4:37:26", "remaining_time": "0:04:30", "throughput": 4090.06, "total_tokens": 68083960} +{"current_steps": 117455, "total_steps": 119360, "loss": 0.4271, "lr": 7.765518490019386e-09, "epoch": 19.680797587131366, "percentage": 98.4, "elapsed_time": "4:37:26", "remaining_time": "0:04:29", "throughput": 4090.07, "total_tokens": 68086808} +{"current_steps": 117460, "total_steps": 119360, "loss": 0.2778, "lr": 7.72483992080686e-09, "epoch": 19.681635388739945, "percentage": 98.41, "elapsed_time": "4:37:27", "remaining_time": "0:04:29", "throughput": 4090.08, "total_tokens": 68089784} +{"current_steps": 117465, "total_steps": 119360, "loss": 0.4626, "lr": 7.684268093666735e-09, "epoch": 19.682473190348524, "percentage": 98.41, "elapsed_time": "4:37:28", "remaining_time": "0:04:28", "throughput": 4090.08, "total_tokens": 68092280} +{"current_steps": 117470, "total_steps": 119360, "loss": 0.2778, "lr": 7.643803009465544e-09, "epoch": 19.683310991957104, "percentage": 98.42, "elapsed_time": "4:37:28", "remaining_time": "0:04:27", "throughput": 4090.1, "total_tokens": 68095384} +{"current_steps": 117475, "total_steps": 119360, "loss": 0.4081, "lr": 7.60344466906926e-09, "epoch": 19.684148793565683, "percentage": 98.42, "elapsed_time": "4:37:29", "remaining_time": "0:04:27", "throughput": 4090.11, "total_tokens": 68098424} +{"current_steps": 117480, "total_steps": 119360, "loss": 0.6468, "lr": 7.563193073340525e-09, "epoch": 19.684986595174262, "percentage": 98.42, "elapsed_time": "4:37:30", "remaining_time": "0:04:26", "throughput": 4090.12, "total_tokens": 68101176} +{"current_steps": 117485, "total_steps": 119360, "loss": 0.4265, "lr": 7.523048223139762e-09, "epoch": 19.68582439678284, "percentage": 98.43, "elapsed_time": "4:37:30", "remaining_time": "0:04:25", "throughput": 4090.13, "total_tokens": 68104056} +{"current_steps": 117490, "total_steps": 119360, "loss": 0.3383, "lr": 7.483010119325728e-09, "epoch": 19.68666219839142, "percentage": 98.43, "elapsed_time": "4:37:31", "remaining_time": "0:04:25", "throughput": 4090.13, "total_tokens": 68106808} +{"current_steps": 117495, "total_steps": 119360, "loss": 0.1896, "lr": 7.443078762754407e-09, "epoch": 19.6875, "percentage": 98.44, "elapsed_time": "4:37:32", "remaining_time": "0:04:24", "throughput": 4090.14, "total_tokens": 68109816} +{"current_steps": 117500, "total_steps": 119360, "loss": 0.5177, "lr": 7.40325415427956e-09, "epoch": 19.68833780160858, "percentage": 98.44, "elapsed_time": "4:37:32", "remaining_time": "0:04:23", "throughput": 4090.15, "total_tokens": 68112664} +{"current_steps": 117505, "total_steps": 119360, "loss": 0.4692, "lr": 7.363536294752172e-09, "epoch": 19.68917560321716, "percentage": 98.45, "elapsed_time": "4:37:33", "remaining_time": "0:04:22", "throughput": 4090.16, "total_tokens": 68115384} +{"current_steps": 117510, "total_steps": 119360, "loss": 0.1703, "lr": 7.323925185022673e-09, "epoch": 19.690013404825738, "percentage": 98.45, "elapsed_time": "4:37:34", "remaining_time": "0:04:22", "throughput": 4090.16, "total_tokens": 68118200} +{"current_steps": 117515, "total_steps": 119360, "loss": 0.3473, "lr": 7.2844208259365e-09, "epoch": 19.690851206434317, "percentage": 98.45, "elapsed_time": "4:37:34", "remaining_time": "0:04:21", "throughput": 4090.17, "total_tokens": 68121080} +{"current_steps": 117520, "total_steps": 119360, "loss": 0.3184, "lr": 7.245023218339642e-09, "epoch": 19.691689008042896, "percentage": 98.46, "elapsed_time": "4:37:35", "remaining_time": "0:04:20", "throughput": 4090.18, "total_tokens": 68123960} +{"current_steps": 117525, "total_steps": 119360, "loss": 0.2572, "lr": 7.2057323630736475e-09, "epoch": 19.692526809651476, "percentage": 98.46, "elapsed_time": "4:37:36", "remaining_time": "0:04:20", "throughput": 4090.19, "total_tokens": 68126616} +{"current_steps": 117530, "total_steps": 119360, "loss": 0.3539, "lr": 7.166548260978956e-09, "epoch": 19.693364611260055, "percentage": 98.47, "elapsed_time": "4:37:36", "remaining_time": "0:04:19", "throughput": 4090.2, "total_tokens": 68129400} +{"current_steps": 117535, "total_steps": 119360, "loss": 0.3422, "lr": 7.1274709128932306e-09, "epoch": 19.694202412868634, "percentage": 98.47, "elapsed_time": "4:37:37", "remaining_time": "0:04:18", "throughput": 4090.21, "total_tokens": 68132248} +{"current_steps": 117540, "total_steps": 119360, "loss": 0.3065, "lr": 7.088500319651914e-09, "epoch": 19.695040214477213, "percentage": 98.48, "elapsed_time": "4:37:38", "remaining_time": "0:04:17", "throughput": 4090.21, "total_tokens": 68135160} +{"current_steps": 117545, "total_steps": 119360, "loss": 0.1681, "lr": 7.049636482088784e-09, "epoch": 19.695878016085793, "percentage": 98.48, "elapsed_time": "4:37:38", "remaining_time": "0:04:17", "throughput": 4090.22, "total_tokens": 68137912} +{"current_steps": 117550, "total_steps": 119360, "loss": 0.3046, "lr": 7.010879401034287e-09, "epoch": 19.69671581769437, "percentage": 98.48, "elapsed_time": "4:37:39", "remaining_time": "0:04:16", "throughput": 4090.22, "total_tokens": 68140664} +{"current_steps": 117555, "total_steps": 119360, "loss": 0.3624, "lr": 6.972229077317205e-09, "epoch": 19.697553619302948, "percentage": 98.49, "elapsed_time": "4:37:40", "remaining_time": "0:04:15", "throughput": 4090.23, "total_tokens": 68143416} +{"current_steps": 117560, "total_steps": 119360, "loss": 0.3692, "lr": 6.933685511763544e-09, "epoch": 19.698391420911527, "percentage": 98.49, "elapsed_time": "4:37:40", "remaining_time": "0:04:15", "throughput": 4090.24, "total_tokens": 68146264} +{"current_steps": 117565, "total_steps": 119360, "loss": 0.3265, "lr": 6.895248705198754e-09, "epoch": 19.699229222520106, "percentage": 98.5, "elapsed_time": "4:37:41", "remaining_time": "0:04:14", "throughput": 4090.24, "total_tokens": 68148920} +{"current_steps": 117570, "total_steps": 119360, "loss": 0.2451, "lr": 6.85691865844329e-09, "epoch": 19.700067024128685, "percentage": 98.5, "elapsed_time": "4:37:41", "remaining_time": "0:04:13", "throughput": 4090.24, "total_tokens": 68151480} +{"current_steps": 117575, "total_steps": 119360, "loss": 0.4881, "lr": 6.818695372317053e-09, "epoch": 19.700904825737265, "percentage": 98.5, "elapsed_time": "4:37:42", "remaining_time": "0:04:12", "throughput": 4090.25, "total_tokens": 68154360} +{"current_steps": 117580, "total_steps": 119360, "loss": 0.4705, "lr": 6.78057884763772e-09, "epoch": 19.701742627345844, "percentage": 98.51, "elapsed_time": "4:37:43", "remaining_time": "0:04:12", "throughput": 4090.26, "total_tokens": 68157304} +{"current_steps": 117585, "total_steps": 119360, "loss": 0.1967, "lr": 6.742569085219641e-09, "epoch": 19.702580428954423, "percentage": 98.51, "elapsed_time": "4:37:43", "remaining_time": "0:04:11", "throughput": 4090.27, "total_tokens": 68160120} +{"current_steps": 117590, "total_steps": 119360, "loss": 0.6622, "lr": 6.70466608587661e-09, "epoch": 19.703418230563003, "percentage": 98.52, "elapsed_time": "4:37:44", "remaining_time": "0:04:10", "throughput": 4090.28, "total_tokens": 68163096} +{"current_steps": 117595, "total_steps": 119360, "loss": 0.4523, "lr": 6.6668698504174236e-09, "epoch": 19.704256032171582, "percentage": 98.52, "elapsed_time": "4:37:45", "remaining_time": "0:04:10", "throughput": 4090.28, "total_tokens": 68165848} +{"current_steps": 117600, "total_steps": 119360, "loss": 0.3402, "lr": 6.6291803796519895e-09, "epoch": 19.70509383378016, "percentage": 98.53, "elapsed_time": "4:37:46", "remaining_time": "0:04:09", "throughput": 4090.29, "total_tokens": 68168856} +{"current_steps": 117605, "total_steps": 119360, "loss": 0.3849, "lr": 6.5915976743846644e-09, "epoch": 19.70593163538874, "percentage": 98.53, "elapsed_time": "4:37:46", "remaining_time": "0:04:08", "throughput": 4090.3, "total_tokens": 68171704} +{"current_steps": 117610, "total_steps": 119360, "loss": 0.3108, "lr": 6.554121735419805e-09, "epoch": 19.70676943699732, "percentage": 98.53, "elapsed_time": "4:37:47", "remaining_time": "0:04:08", "throughput": 4090.31, "total_tokens": 68174808} +{"current_steps": 117615, "total_steps": 119360, "loss": 0.2695, "lr": 6.516752563558993e-09, "epoch": 19.7076072386059, "percentage": 98.54, "elapsed_time": "4:37:48", "remaining_time": "0:04:07", "throughput": 4090.32, "total_tokens": 68177592} +{"current_steps": 117620, "total_steps": 119360, "loss": 0.3359, "lr": 6.479490159599922e-09, "epoch": 19.708445040214478, "percentage": 98.54, "elapsed_time": "4:37:48", "remaining_time": "0:04:06", "throughput": 4090.33, "total_tokens": 68180472} +{"current_steps": 117625, "total_steps": 119360, "loss": 0.3574, "lr": 6.442334524340843e-09, "epoch": 19.709282841823057, "percentage": 98.55, "elapsed_time": "4:37:49", "remaining_time": "0:04:05", "throughput": 4090.33, "total_tokens": 68183416} +{"current_steps": 117630, "total_steps": 119360, "loss": 0.2887, "lr": 6.405285658575566e-09, "epoch": 19.710120643431637, "percentage": 98.55, "elapsed_time": "4:37:50", "remaining_time": "0:04:05", "throughput": 4090.34, "total_tokens": 68186072} +{"current_steps": 117635, "total_steps": 119360, "loss": 0.2676, "lr": 6.36834356309568e-09, "epoch": 19.710958445040216, "percentage": 98.55, "elapsed_time": "4:37:50", "remaining_time": "0:04:04", "throughput": 4090.34, "total_tokens": 68189048} +{"current_steps": 117640, "total_steps": 119360, "loss": 0.4663, "lr": 6.331508238692219e-09, "epoch": 19.711796246648795, "percentage": 98.56, "elapsed_time": "4:37:51", "remaining_time": "0:04:03", "throughput": 4090.35, "total_tokens": 68192088} +{"current_steps": 117645, "total_steps": 119360, "loss": 0.3623, "lr": 6.294779686151775e-09, "epoch": 19.71263404825737, "percentage": 98.56, "elapsed_time": "4:37:52", "remaining_time": "0:04:03", "throughput": 4090.36, "total_tokens": 68194776} +{"current_steps": 117650, "total_steps": 119360, "loss": 0.4294, "lr": 6.258157906260387e-09, "epoch": 19.71347184986595, "percentage": 98.57, "elapsed_time": "4:37:52", "remaining_time": "0:04:02", "throughput": 4090.37, "total_tokens": 68197624} +{"current_steps": 117655, "total_steps": 119360, "loss": 0.4213, "lr": 6.221642899800207e-09, "epoch": 19.71430965147453, "percentage": 98.57, "elapsed_time": "4:37:53", "remaining_time": "0:04:01", "throughput": 4090.37, "total_tokens": 68200376} +{"current_steps": 117660, "total_steps": 119360, "loss": 0.3917, "lr": 6.1852346675528305e-09, "epoch": 19.71514745308311, "percentage": 98.58, "elapsed_time": "4:37:54", "remaining_time": "0:04:00", "throughput": 4090.38, "total_tokens": 68203288} +{"current_steps": 117665, "total_steps": 119360, "loss": 0.3274, "lr": 6.148933210296526e-09, "epoch": 19.715985254691688, "percentage": 98.58, "elapsed_time": "4:37:54", "remaining_time": "0:04:00", "throughput": 4090.39, "total_tokens": 68205944} +{"current_steps": 117670, "total_steps": 119360, "loss": 0.3826, "lr": 6.112738528807338e-09, "epoch": 19.716823056300267, "percentage": 98.58, "elapsed_time": "4:37:55", "remaining_time": "0:03:59", "throughput": 4090.4, "total_tokens": 68208984} +{"current_steps": 117675, "total_steps": 119360, "loss": 0.2953, "lr": 6.0766506238590924e-09, "epoch": 19.717660857908847, "percentage": 98.59, "elapsed_time": "4:37:56", "remaining_time": "0:03:58", "throughput": 4090.41, "total_tokens": 68211864} +{"current_steps": 117680, "total_steps": 119360, "loss": 0.3097, "lr": 6.040669496223395e-09, "epoch": 19.718498659517426, "percentage": 98.59, "elapsed_time": "4:37:56", "remaining_time": "0:03:58", "throughput": 4090.42, "total_tokens": 68214648} +{"current_steps": 117685, "total_steps": 119360, "loss": 0.4064, "lr": 6.0047951466696285e-09, "epoch": 19.719336461126005, "percentage": 98.6, "elapsed_time": "4:37:57", "remaining_time": "0:03:57", "throughput": 4090.42, "total_tokens": 68217368} +{"current_steps": 117690, "total_steps": 119360, "loss": 0.302, "lr": 5.969027575964959e-09, "epoch": 19.720174262734584, "percentage": 98.6, "elapsed_time": "4:37:58", "remaining_time": "0:03:56", "throughput": 4090.43, "total_tokens": 68220344} +{"current_steps": 117695, "total_steps": 119360, "loss": 0.2825, "lr": 5.933366784873773e-09, "epoch": 19.721012064343164, "percentage": 98.61, "elapsed_time": "4:37:58", "remaining_time": "0:03:55", "throughput": 4090.44, "total_tokens": 68223128} +{"current_steps": 117700, "total_steps": 119360, "loss": 0.2326, "lr": 5.897812774158796e-09, "epoch": 19.721849865951743, "percentage": 98.61, "elapsed_time": "4:37:59", "remaining_time": "0:03:55", "throughput": 4090.45, "total_tokens": 68226264} +{"current_steps": 117705, "total_steps": 119360, "loss": 0.2848, "lr": 5.862365544580528e-09, "epoch": 19.722687667560322, "percentage": 98.61, "elapsed_time": "4:38:00", "remaining_time": "0:03:54", "throughput": 4090.46, "total_tokens": 68229304} +{"current_steps": 117710, "total_steps": 119360, "loss": 0.3573, "lr": 5.827025096896699e-09, "epoch": 19.7235254691689, "percentage": 98.62, "elapsed_time": "4:38:00", "remaining_time": "0:03:53", "throughput": 4090.46, "total_tokens": 68231960} +{"current_steps": 117715, "total_steps": 119360, "loss": 0.2261, "lr": 5.791791431862815e-09, "epoch": 19.72436327077748, "percentage": 98.62, "elapsed_time": "4:38:01", "remaining_time": "0:03:53", "throughput": 4090.47, "total_tokens": 68235064} +{"current_steps": 117720, "total_steps": 119360, "loss": 0.4406, "lr": 5.75666455023216e-09, "epoch": 19.72520107238606, "percentage": 98.63, "elapsed_time": "4:38:02", "remaining_time": "0:03:52", "throughput": 4090.48, "total_tokens": 68237848} +{"current_steps": 117725, "total_steps": 119360, "loss": 0.2414, "lr": 5.721644452755803e-09, "epoch": 19.72603887399464, "percentage": 98.63, "elapsed_time": "4:38:02", "remaining_time": "0:03:51", "throughput": 4090.48, "total_tokens": 68240664} +{"current_steps": 117730, "total_steps": 119360, "loss": 0.4786, "lr": 5.686731140183144e-09, "epoch": 19.72687667560322, "percentage": 98.63, "elapsed_time": "4:38:03", "remaining_time": "0:03:50", "throughput": 4090.5, "total_tokens": 68243736} +{"current_steps": 117735, "total_steps": 119360, "loss": 0.4501, "lr": 5.651924613259696e-09, "epoch": 19.727714477211798, "percentage": 98.64, "elapsed_time": "4:38:04", "remaining_time": "0:03:50", "throughput": 4090.5, "total_tokens": 68246520} +{"current_steps": 117740, "total_steps": 119360, "loss": 0.6946, "lr": 5.617224872729865e-09, "epoch": 19.728552278820374, "percentage": 98.64, "elapsed_time": "4:38:04", "remaining_time": "0:03:49", "throughput": 4090.52, "total_tokens": 68249848} +{"current_steps": 117745, "total_steps": 119360, "loss": 0.297, "lr": 5.5826319193363894e-09, "epoch": 19.729390080428953, "percentage": 98.65, "elapsed_time": "4:38:05", "remaining_time": "0:03:48", "throughput": 4090.53, "total_tokens": 68252664} +{"current_steps": 117750, "total_steps": 119360, "loss": 0.2505, "lr": 5.548145753818124e-09, "epoch": 19.730227882037532, "percentage": 98.65, "elapsed_time": "4:38:06", "remaining_time": "0:03:48", "throughput": 4090.53, "total_tokens": 68255480} +{"current_steps": 117755, "total_steps": 119360, "loss": 0.1938, "lr": 5.51376637691281e-09, "epoch": 19.73106568364611, "percentage": 98.66, "elapsed_time": "4:38:06", "remaining_time": "0:03:47", "throughput": 4090.54, "total_tokens": 68258360} +{"current_steps": 117760, "total_steps": 119360, "loss": 0.4673, "lr": 5.479493789355416e-09, "epoch": 19.73190348525469, "percentage": 98.66, "elapsed_time": "4:38:07", "remaining_time": "0:03:46", "throughput": 4090.55, "total_tokens": 68261080} +{"current_steps": 117765, "total_steps": 119360, "loss": 0.4112, "lr": 5.445327991878136e-09, "epoch": 19.73274128686327, "percentage": 98.66, "elapsed_time": "4:38:08", "remaining_time": "0:03:46", "throughput": 4090.55, "total_tokens": 68264056} +{"current_steps": 117770, "total_steps": 119360, "loss": 0.4789, "lr": 5.411268985212603e-09, "epoch": 19.73357908847185, "percentage": 98.67, "elapsed_time": "4:38:08", "remaining_time": "0:03:45", "throughput": 4090.56, "total_tokens": 68266936} +{"current_steps": 117775, "total_steps": 119360, "loss": 0.1771, "lr": 5.3773167700865716e-09, "epoch": 19.73441689008043, "percentage": 98.67, "elapsed_time": "4:38:09", "remaining_time": "0:03:44", "throughput": 4090.57, "total_tokens": 68269816} +{"current_steps": 117780, "total_steps": 119360, "loss": 0.4804, "lr": 5.343471347226126e-09, "epoch": 19.735254691689008, "percentage": 98.68, "elapsed_time": "4:38:10", "remaining_time": "0:03:43", "throughput": 4090.57, "total_tokens": 68272504} +{"current_steps": 117785, "total_steps": 119360, "loss": 0.3683, "lr": 5.309732717354021e-09, "epoch": 19.736092493297587, "percentage": 98.68, "elapsed_time": "4:38:10", "remaining_time": "0:03:43", "throughput": 4090.58, "total_tokens": 68275480} +{"current_steps": 117790, "total_steps": 119360, "loss": 0.1891, "lr": 5.2761008811930134e-09, "epoch": 19.736930294906166, "percentage": 98.68, "elapsed_time": "4:38:11", "remaining_time": "0:03:42", "throughput": 4090.59, "total_tokens": 68278200} +{"current_steps": 117795, "total_steps": 119360, "loss": 0.3295, "lr": 5.242575839461417e-09, "epoch": 19.737768096514746, "percentage": 98.69, "elapsed_time": "4:38:12", "remaining_time": "0:03:41", "throughput": 4090.59, "total_tokens": 68281112} +{"current_steps": 117800, "total_steps": 119360, "loss": 0.3122, "lr": 5.20915759287588e-09, "epoch": 19.738605898123325, "percentage": 98.69, "elapsed_time": "4:38:12", "remaining_time": "0:03:41", "throughput": 4090.6, "total_tokens": 68283864} +{"current_steps": 117805, "total_steps": 119360, "loss": 0.324, "lr": 5.175846142151386e-09, "epoch": 19.739443699731904, "percentage": 98.7, "elapsed_time": "4:38:13", "remaining_time": "0:03:40", "throughput": 4090.61, "total_tokens": 68286520} +{"current_steps": 117810, "total_steps": 119360, "loss": 0.2624, "lr": 5.142641488000144e-09, "epoch": 19.740281501340483, "percentage": 98.7, "elapsed_time": "4:38:14", "remaining_time": "0:03:39", "throughput": 4090.61, "total_tokens": 68289144} +{"current_steps": 117815, "total_steps": 119360, "loss": 0.5158, "lr": 5.109543631132141e-09, "epoch": 19.741119302949063, "percentage": 98.71, "elapsed_time": "4:38:14", "remaining_time": "0:03:38", "throughput": 4090.62, "total_tokens": 68292056} +{"current_steps": 117820, "total_steps": 119360, "loss": 0.3814, "lr": 5.07655257225459e-09, "epoch": 19.741957104557642, "percentage": 98.71, "elapsed_time": "4:38:15", "remaining_time": "0:03:38", "throughput": 4090.63, "total_tokens": 68295064} +{"current_steps": 117825, "total_steps": 119360, "loss": 0.6296, "lr": 5.043668312073036e-09, "epoch": 19.74279490616622, "percentage": 98.71, "elapsed_time": "4:38:16", "remaining_time": "0:03:37", "throughput": 4090.63, "total_tokens": 68297656} +{"current_steps": 117830, "total_steps": 119360, "loss": 0.0981, "lr": 5.010890851291361e-09, "epoch": 19.7436327077748, "percentage": 98.72, "elapsed_time": "4:38:16", "remaining_time": "0:03:36", "throughput": 4090.64, "total_tokens": 68300632} +{"current_steps": 117835, "total_steps": 119360, "loss": 0.264, "lr": 4.978220190609562e-09, "epoch": 19.74447050938338, "percentage": 98.72, "elapsed_time": "4:38:17", "remaining_time": "0:03:36", "throughput": 4090.64, "total_tokens": 68303416} +{"current_steps": 117840, "total_steps": 119360, "loss": 0.2345, "lr": 4.945656330725968e-09, "epoch": 19.74530831099196, "percentage": 98.73, "elapsed_time": "4:38:18", "remaining_time": "0:03:35", "throughput": 4090.65, "total_tokens": 68306040} +{"current_steps": 117845, "total_steps": 119360, "loss": 0.2694, "lr": 4.913199272337799e-09, "epoch": 19.746146112600535, "percentage": 98.73, "elapsed_time": "4:38:18", "remaining_time": "0:03:34", "throughput": 4090.66, "total_tokens": 68309176} +{"current_steps": 117850, "total_steps": 119360, "loss": 0.168, "lr": 4.8808490161383895e-09, "epoch": 19.746983914209114, "percentage": 98.73, "elapsed_time": "4:38:19", "remaining_time": "0:03:33", "throughput": 4090.67, "total_tokens": 68312152} +{"current_steps": 117855, "total_steps": 119360, "loss": 0.2884, "lr": 4.848605562819409e-09, "epoch": 19.747821715817693, "percentage": 98.74, "elapsed_time": "4:38:20", "remaining_time": "0:03:33", "throughput": 4090.69, "total_tokens": 68315128} +{"current_steps": 117860, "total_steps": 119360, "loss": 0.3237, "lr": 4.8164689130708596e-09, "epoch": 19.748659517426272, "percentage": 98.74, "elapsed_time": "4:38:20", "remaining_time": "0:03:32", "throughput": 4090.7, "total_tokens": 68318232} +{"current_steps": 117865, "total_steps": 119360, "loss": 0.3063, "lr": 4.784439067579416e-09, "epoch": 19.74949731903485, "percentage": 98.75, "elapsed_time": "4:38:21", "remaining_time": "0:03:31", "throughput": 4090.71, "total_tokens": 68321208} +{"current_steps": 117870, "total_steps": 119360, "loss": 0.4179, "lr": 4.75251602702953e-09, "epoch": 19.75033512064343, "percentage": 98.75, "elapsed_time": "4:38:22", "remaining_time": "0:03:31", "throughput": 4090.72, "total_tokens": 68324504} +{"current_steps": 117875, "total_steps": 119360, "loss": 0.1606, "lr": 4.720699792103989e-09, "epoch": 19.75117292225201, "percentage": 98.76, "elapsed_time": "4:38:23", "remaining_time": "0:03:30", "throughput": 4090.73, "total_tokens": 68327672} +{"current_steps": 117880, "total_steps": 119360, "loss": 0.311, "lr": 4.688990363483914e-09, "epoch": 19.75201072386059, "percentage": 98.76, "elapsed_time": "4:38:23", "remaining_time": "0:03:29", "throughput": 4090.74, "total_tokens": 68330680} +{"current_steps": 117885, "total_steps": 119360, "loss": 0.1371, "lr": 4.657387741846542e-09, "epoch": 19.75284852546917, "percentage": 98.76, "elapsed_time": "4:38:24", "remaining_time": "0:03:29", "throughput": 4090.75, "total_tokens": 68333528} +{"current_steps": 117890, "total_steps": 119360, "loss": 0.4933, "lr": 4.625891927867443e-09, "epoch": 19.753686327077748, "percentage": 98.77, "elapsed_time": "4:38:25", "remaining_time": "0:03:28", "throughput": 4090.76, "total_tokens": 68336408} +{"current_steps": 117895, "total_steps": 119360, "loss": 0.5303, "lr": 4.5945029222205225e-09, "epoch": 19.754524128686327, "percentage": 98.77, "elapsed_time": "4:38:25", "remaining_time": "0:03:27", "throughput": 4090.76, "total_tokens": 68339064} +{"current_steps": 117900, "total_steps": 119360, "loss": 0.2513, "lr": 4.563220725576356e-09, "epoch": 19.755361930294907, "percentage": 98.78, "elapsed_time": "4:38:26", "remaining_time": "0:03:26", "throughput": 4090.77, "total_tokens": 68341784} +{"current_steps": 117905, "total_steps": 119360, "loss": 0.2608, "lr": 4.5320453386044075e-09, "epoch": 19.756199731903486, "percentage": 98.78, "elapsed_time": "4:38:26", "remaining_time": "0:03:26", "throughput": 4090.77, "total_tokens": 68344440} +{"current_steps": 117910, "total_steps": 119360, "loss": 0.3144, "lr": 4.50097676197081e-09, "epoch": 19.757037533512065, "percentage": 98.79, "elapsed_time": "4:38:27", "remaining_time": "0:03:25", "throughput": 4090.78, "total_tokens": 68347224} +{"current_steps": 117915, "total_steps": 119360, "loss": 0.3341, "lr": 4.470014996340588e-09, "epoch": 19.757875335120644, "percentage": 98.79, "elapsed_time": "4:38:28", "remaining_time": "0:03:24", "throughput": 4090.79, "total_tokens": 68350008} +{"current_steps": 117920, "total_steps": 119360, "loss": 0.1957, "lr": 4.439160042374324e-09, "epoch": 19.758713136729224, "percentage": 98.79, "elapsed_time": "4:38:28", "remaining_time": "0:03:24", "throughput": 4090.79, "total_tokens": 68352728} +{"current_steps": 117925, "total_steps": 119360, "loss": 0.2427, "lr": 4.408411900733156e-09, "epoch": 19.759550938337803, "percentage": 98.8, "elapsed_time": "4:38:29", "remaining_time": "0:03:23", "throughput": 4090.8, "total_tokens": 68355608} +{"current_steps": 117930, "total_steps": 119360, "loss": 0.2338, "lr": 4.37777057207378e-09, "epoch": 19.760388739946382, "percentage": 98.8, "elapsed_time": "4:38:30", "remaining_time": "0:03:22", "throughput": 4090.81, "total_tokens": 68358488} +{"current_steps": 117935, "total_steps": 119360, "loss": 0.4265, "lr": 4.347236057051785e-09, "epoch": 19.76122654155496, "percentage": 98.81, "elapsed_time": "4:38:30", "remaining_time": "0:03:21", "throughput": 4090.81, "total_tokens": 68361240} +{"current_steps": 117940, "total_steps": 119360, "loss": 0.2359, "lr": 4.316808356319424e-09, "epoch": 19.762064343163537, "percentage": 98.81, "elapsed_time": "4:38:31", "remaining_time": "0:03:21", "throughput": 4090.82, "total_tokens": 68363960} +{"current_steps": 117945, "total_steps": 119360, "loss": 0.3228, "lr": 4.2864874705278445e-09, "epoch": 19.762902144772116, "percentage": 98.81, "elapsed_time": "4:38:32", "remaining_time": "0:03:20", "throughput": 4090.82, "total_tokens": 68366744} +{"current_steps": 117950, "total_steps": 119360, "loss": 0.2598, "lr": 4.256273400325417e-09, "epoch": 19.763739946380696, "percentage": 98.82, "elapsed_time": "4:38:32", "remaining_time": "0:03:19", "throughput": 4090.84, "total_tokens": 68369848} +{"current_steps": 117955, "total_steps": 119360, "loss": 0.3071, "lr": 4.226166146357735e-09, "epoch": 19.764577747989275, "percentage": 98.82, "elapsed_time": "4:38:33", "remaining_time": "0:03:19", "throughput": 4090.85, "total_tokens": 68372600} +{"current_steps": 117960, "total_steps": 119360, "loss": 0.2504, "lr": 4.196165709268729e-09, "epoch": 19.765415549597854, "percentage": 98.83, "elapsed_time": "4:38:34", "remaining_time": "0:03:18", "throughput": 4090.85, "total_tokens": 68375256} +{"current_steps": 117965, "total_steps": 119360, "loss": 0.3459, "lr": 4.166272089699552e-09, "epoch": 19.766253351206434, "percentage": 98.83, "elapsed_time": "4:38:34", "remaining_time": "0:03:17", "throughput": 4090.85, "total_tokens": 68377976} +{"current_steps": 117970, "total_steps": 119360, "loss": 0.528, "lr": 4.136485288290248e-09, "epoch": 19.767091152815013, "percentage": 98.84, "elapsed_time": "4:38:35", "remaining_time": "0:03:16", "throughput": 4090.86, "total_tokens": 68380792} +{"current_steps": 117975, "total_steps": 119360, "loss": 0.434, "lr": 4.10680530567642e-09, "epoch": 19.767928954423592, "percentage": 98.84, "elapsed_time": "4:38:36", "remaining_time": "0:03:16", "throughput": 4090.87, "total_tokens": 68383832} +{"current_steps": 117980, "total_steps": 119360, "loss": 0.2314, "lr": 4.07723214249367e-09, "epoch": 19.76876675603217, "percentage": 98.84, "elapsed_time": "4:38:36", "remaining_time": "0:03:15", "throughput": 4090.87, "total_tokens": 68386488} +{"current_steps": 117985, "total_steps": 119360, "loss": 0.2669, "lr": 4.04776579937427e-09, "epoch": 19.76960455764075, "percentage": 98.85, "elapsed_time": "4:38:37", "remaining_time": "0:03:14", "throughput": 4090.88, "total_tokens": 68389528} +{"current_steps": 117990, "total_steps": 119360, "loss": 0.4521, "lr": 4.0184062769477176e-09, "epoch": 19.77044235924933, "percentage": 98.85, "elapsed_time": "4:38:38", "remaining_time": "0:03:14", "throughput": 4090.89, "total_tokens": 68392312} +{"current_steps": 117995, "total_steps": 119360, "loss": 0.5432, "lr": 3.989153575842397e-09, "epoch": 19.77128016085791, "percentage": 98.86, "elapsed_time": "4:38:38", "remaining_time": "0:03:13", "throughput": 4090.9, "total_tokens": 68395128} +{"current_steps": 118000, "total_steps": 119360, "loss": 0.5941, "lr": 3.960007696682811e-09, "epoch": 19.77211796246649, "percentage": 98.86, "elapsed_time": "4:38:39", "remaining_time": "0:03:12", "throughput": 4090.9, "total_tokens": 68397720} +{"current_steps": 118005, "total_steps": 119360, "loss": 0.3077, "lr": 3.930968640092902e-09, "epoch": 19.772955764075068, "percentage": 98.86, "elapsed_time": "4:38:40", "remaining_time": "0:03:11", "throughput": 4090.91, "total_tokens": 68400952} +{"current_steps": 118010, "total_steps": 119360, "loss": 0.499, "lr": 3.902036406693843e-09, "epoch": 19.773793565683647, "percentage": 98.87, "elapsed_time": "4:38:40", "remaining_time": "0:03:11", "throughput": 4090.93, "total_tokens": 68404088} +{"current_steps": 118015, "total_steps": 119360, "loss": 0.2653, "lr": 3.873210997103471e-09, "epoch": 19.774631367292226, "percentage": 98.87, "elapsed_time": "4:38:41", "remaining_time": "0:03:10", "throughput": 4090.94, "total_tokens": 68407096} +{"current_steps": 118020, "total_steps": 119360, "loss": 0.3717, "lr": 3.844492411938516e-09, "epoch": 19.775469168900806, "percentage": 98.88, "elapsed_time": "4:38:42", "remaining_time": "0:03:09", "throughput": 4090.95, "total_tokens": 68410008} +{"current_steps": 118025, "total_steps": 119360, "loss": 0.3521, "lr": 3.815880651812931e-09, "epoch": 19.776306970509385, "percentage": 98.88, "elapsed_time": "4:38:43", "remaining_time": "0:03:09", "throughput": 4090.96, "total_tokens": 68413176} +{"current_steps": 118030, "total_steps": 119360, "loss": 0.4951, "lr": 3.7873757173384485e-09, "epoch": 19.777144772117964, "percentage": 98.89, "elapsed_time": "4:38:43", "remaining_time": "0:03:08", "throughput": 4090.97, "total_tokens": 68416024} +{"current_steps": 118035, "total_steps": 119360, "loss": 0.1832, "lr": 3.758977609124581e-09, "epoch": 19.77798257372654, "percentage": 98.89, "elapsed_time": "4:38:44", "remaining_time": "0:03:07", "throughput": 4090.99, "total_tokens": 68419288} +{"current_steps": 118040, "total_steps": 119360, "loss": 0.3366, "lr": 3.7306863277786206e-09, "epoch": 19.77882037533512, "percentage": 98.89, "elapsed_time": "4:38:45", "remaining_time": "0:03:07", "throughput": 4091.0, "total_tokens": 68422328} +{"current_steps": 118045, "total_steps": 119360, "loss": 0.3086, "lr": 3.7025018739056394e-09, "epoch": 19.7796581769437, "percentage": 98.9, "elapsed_time": "4:38:45", "remaining_time": "0:03:06", "throughput": 4091.02, "total_tokens": 68425656} +{"current_steps": 118050, "total_steps": 119360, "loss": 0.1531, "lr": 3.674424248107933e-09, "epoch": 19.780495978552278, "percentage": 98.9, "elapsed_time": "4:38:46", "remaining_time": "0:03:05", "throughput": 4091.03, "total_tokens": 68428536} +{"current_steps": 118055, "total_steps": 119360, "loss": 0.1429, "lr": 3.6464534509855764e-09, "epoch": 19.781333780160857, "percentage": 98.91, "elapsed_time": "4:38:47", "remaining_time": "0:03:04", "throughput": 4091.03, "total_tokens": 68431384} +{"current_steps": 118060, "total_steps": 119360, "loss": 0.2836, "lr": 3.6185894831375355e-09, "epoch": 19.782171581769436, "percentage": 98.91, "elapsed_time": "4:38:47", "remaining_time": "0:03:04", "throughput": 4091.03, "total_tokens": 68433944} +{"current_steps": 118065, "total_steps": 119360, "loss": 0.4478, "lr": 3.590832345158335e-09, "epoch": 19.783009383378015, "percentage": 98.92, "elapsed_time": "4:38:48", "remaining_time": "0:03:03", "throughput": 4091.04, "total_tokens": 68436664} +{"current_steps": 118070, "total_steps": 119360, "loss": 0.3601, "lr": 3.5631820376424985e-09, "epoch": 19.783847184986595, "percentage": 98.92, "elapsed_time": "4:38:49", "remaining_time": "0:03:02", "throughput": 4091.05, "total_tokens": 68439704} +{"current_steps": 118075, "total_steps": 119360, "loss": 0.4015, "lr": 3.5356385611812203e-09, "epoch": 19.784684986595174, "percentage": 98.92, "elapsed_time": "4:38:49", "remaining_time": "0:03:02", "throughput": 4091.06, "total_tokens": 68442712} +{"current_steps": 118080, "total_steps": 119360, "loss": 0.1652, "lr": 3.508201916362364e-09, "epoch": 19.785522788203753, "percentage": 98.93, "elapsed_time": "4:38:50", "remaining_time": "0:03:01", "throughput": 4091.07, "total_tokens": 68445720} +{"current_steps": 118085, "total_steps": 119360, "loss": 0.3189, "lr": 3.4808721037737916e-09, "epoch": 19.786360589812332, "percentage": 98.93, "elapsed_time": "4:38:51", "remaining_time": "0:03:00", "throughput": 4091.08, "total_tokens": 68448536} +{"current_steps": 118090, "total_steps": 119360, "loss": 0.2008, "lr": 3.453649123999481e-09, "epoch": 19.78719839142091, "percentage": 98.94, "elapsed_time": "4:38:51", "remaining_time": "0:02:59", "throughput": 4091.09, "total_tokens": 68451608} +{"current_steps": 118095, "total_steps": 119360, "loss": 0.3739, "lr": 3.426532977621189e-09, "epoch": 19.78803619302949, "percentage": 98.94, "elapsed_time": "4:38:52", "remaining_time": "0:02:59", "throughput": 4091.11, "total_tokens": 68454808} +{"current_steps": 118100, "total_steps": 119360, "loss": 0.1851, "lr": 3.3995236652184517e-09, "epoch": 19.78887399463807, "percentage": 98.94, "elapsed_time": "4:38:53", "remaining_time": "0:02:58", "throughput": 4091.11, "total_tokens": 68457752} +{"current_steps": 118105, "total_steps": 119360, "loss": 0.1777, "lr": 3.3726211873696955e-09, "epoch": 19.78971179624665, "percentage": 98.95, "elapsed_time": "4:38:53", "remaining_time": "0:02:57", "throughput": 4091.13, "total_tokens": 68460888} +{"current_steps": 118110, "total_steps": 119360, "loss": 0.0639, "lr": 3.3458255446494612e-09, "epoch": 19.79054959785523, "percentage": 98.95, "elapsed_time": "4:38:54", "remaining_time": "0:02:57", "throughput": 4091.14, "total_tokens": 68463992} +{"current_steps": 118115, "total_steps": 119360, "loss": 0.3714, "lr": 3.319136737631179e-09, "epoch": 19.791387399463808, "percentage": 98.96, "elapsed_time": "4:38:55", "remaining_time": "0:02:56", "throughput": 4091.15, "total_tokens": 68466776} +{"current_steps": 118120, "total_steps": 119360, "loss": 0.2624, "lr": 3.292554766884948e-09, "epoch": 19.792225201072387, "percentage": 98.96, "elapsed_time": "4:38:56", "remaining_time": "0:02:55", "throughput": 4091.15, "total_tokens": 68469752} +{"current_steps": 118125, "total_steps": 119360, "loss": 0.3525, "lr": 3.266079632979202e-09, "epoch": 19.793063002680967, "percentage": 98.97, "elapsed_time": "4:38:56", "remaining_time": "0:02:54", "throughput": 4091.16, "total_tokens": 68472600} +{"current_steps": 118130, "total_steps": 119360, "loss": 0.209, "lr": 3.2397113364801558e-09, "epoch": 19.793900804289546, "percentage": 98.97, "elapsed_time": "4:38:57", "remaining_time": "0:02:54", "throughput": 4091.17, "total_tokens": 68475384} +{"current_steps": 118135, "total_steps": 119360, "loss": 0.2642, "lr": 3.213449877951802e-09, "epoch": 19.79473860589812, "percentage": 98.97, "elapsed_time": "4:38:58", "remaining_time": "0:02:53", "throughput": 4091.17, "total_tokens": 68478168} +{"current_steps": 118140, "total_steps": 119360, "loss": 0.1393, "lr": 3.1872952579553583e-09, "epoch": 19.7955764075067, "percentage": 98.98, "elapsed_time": "4:38:58", "remaining_time": "0:02:52", "throughput": 4091.18, "total_tokens": 68480984} +{"current_steps": 118145, "total_steps": 119360, "loss": 0.3709, "lr": 3.1612474770498227e-09, "epoch": 19.79641420911528, "percentage": 98.98, "elapsed_time": "4:38:59", "remaining_time": "0:02:52", "throughput": 4091.19, "total_tokens": 68483864} +{"current_steps": 118150, "total_steps": 119360, "loss": 0.3459, "lr": 3.1353065357930813e-09, "epoch": 19.79725201072386, "percentage": 98.99, "elapsed_time": "4:39:00", "remaining_time": "0:02:51", "throughput": 4091.2, "total_tokens": 68487096} +{"current_steps": 118155, "total_steps": 119360, "loss": 0.1659, "lr": 3.1094724347385805e-09, "epoch": 19.79808981233244, "percentage": 98.99, "elapsed_time": "4:39:00", "remaining_time": "0:02:50", "throughput": 4091.21, "total_tokens": 68490008} +{"current_steps": 118160, "total_steps": 119360, "loss": 0.2708, "lr": 3.0837451744397675e-09, "epoch": 19.798927613941018, "percentage": 98.99, "elapsed_time": "4:39:01", "remaining_time": "0:02:50", "throughput": 4091.22, "total_tokens": 68492824} +{"current_steps": 118165, "total_steps": 119360, "loss": 0.2083, "lr": 3.058124755445646e-09, "epoch": 19.799765415549597, "percentage": 99.0, "elapsed_time": "4:39:02", "remaining_time": "0:02:49", "throughput": 4091.23, "total_tokens": 68496088} +{"current_steps": 118170, "total_steps": 119360, "loss": 0.2151, "lr": 3.0326111783052225e-09, "epoch": 19.800603217158177, "percentage": 99.0, "elapsed_time": "4:39:02", "remaining_time": "0:02:48", "throughput": 4091.24, "total_tokens": 68499224} +{"current_steps": 118175, "total_steps": 119360, "loss": 0.1869, "lr": 3.007204443563061e-09, "epoch": 19.801441018766756, "percentage": 99.01, "elapsed_time": "4:39:03", "remaining_time": "0:02:47", "throughput": 4091.25, "total_tokens": 68502328} +{"current_steps": 118180, "total_steps": 119360, "loss": 0.506, "lr": 2.9819045517626156e-09, "epoch": 19.802278820375335, "percentage": 99.01, "elapsed_time": "4:39:04", "remaining_time": "0:02:47", "throughput": 4091.26, "total_tokens": 68505048} +{"current_steps": 118185, "total_steps": 119360, "loss": 0.4561, "lr": 2.95671150344512e-09, "epoch": 19.803116621983914, "percentage": 99.02, "elapsed_time": "4:39:04", "remaining_time": "0:02:46", "throughput": 4091.26, "total_tokens": 68507800} +{"current_steps": 118190, "total_steps": 119360, "loss": 0.1379, "lr": 2.9316252991490325e-09, "epoch": 19.803954423592494, "percentage": 99.02, "elapsed_time": "4:39:05", "remaining_time": "0:02:45", "throughput": 4091.26, "total_tokens": 68510456} +{"current_steps": 118195, "total_steps": 119360, "loss": 0.3914, "lr": 2.9066459394111456e-09, "epoch": 19.804792225201073, "percentage": 99.02, "elapsed_time": "4:39:06", "remaining_time": "0:02:45", "throughput": 4091.27, "total_tokens": 68513240} +{"current_steps": 118200, "total_steps": 119360, "loss": 0.4592, "lr": 2.8817734247643668e-09, "epoch": 19.805630026809652, "percentage": 99.03, "elapsed_time": "4:39:06", "remaining_time": "0:02:44", "throughput": 4091.29, "total_tokens": 68516344} +{"current_steps": 118205, "total_steps": 119360, "loss": 0.4246, "lr": 2.8570077557421583e-09, "epoch": 19.80646782841823, "percentage": 99.03, "elapsed_time": "4:39:07", "remaining_time": "0:02:43", "throughput": 4091.29, "total_tokens": 68519352} +{"current_steps": 118210, "total_steps": 119360, "loss": 0.4941, "lr": 2.8323489328729857e-09, "epoch": 19.80730563002681, "percentage": 99.04, "elapsed_time": "4:39:08", "remaining_time": "0:02:42", "throughput": 4091.3, "total_tokens": 68522104} +{"current_steps": 118215, "total_steps": 119360, "loss": 0.2601, "lr": 2.8077969566842054e-09, "epoch": 19.80814343163539, "percentage": 99.04, "elapsed_time": "4:39:08", "remaining_time": "0:02:42", "throughput": 4091.31, "total_tokens": 68524952} +{"current_steps": 118220, "total_steps": 119360, "loss": 0.3853, "lr": 2.7833518277003978e-09, "epoch": 19.80898123324397, "percentage": 99.04, "elapsed_time": "4:39:09", "remaining_time": "0:02:41", "throughput": 4091.31, "total_tokens": 68527896} +{"current_steps": 118225, "total_steps": 119360, "loss": 0.5682, "lr": 2.7590135464450328e-09, "epoch": 19.80981903485255, "percentage": 99.05, "elapsed_time": "4:39:10", "remaining_time": "0:02:40", "throughput": 4091.33, "total_tokens": 68530904} +{"current_steps": 118230, "total_steps": 119360, "loss": 0.1352, "lr": 2.7347821134382503e-09, "epoch": 19.810656836461128, "percentage": 99.05, "elapsed_time": "4:39:11", "remaining_time": "0:02:40", "throughput": 4091.34, "total_tokens": 68534200} +{"current_steps": 118235, "total_steps": 119360, "loss": 0.2219, "lr": 2.710657529198524e-09, "epoch": 19.811494638069703, "percentage": 99.06, "elapsed_time": "4:39:11", "remaining_time": "0:02:39", "throughput": 4091.35, "total_tokens": 68537304} +{"current_steps": 118240, "total_steps": 119360, "loss": 0.2556, "lr": 2.686639794240442e-09, "epoch": 19.812332439678283, "percentage": 99.06, "elapsed_time": "4:39:12", "remaining_time": "0:02:38", "throughput": 4091.35, "total_tokens": 68539928} +{"current_steps": 118245, "total_steps": 119360, "loss": 0.4124, "lr": 2.6627289090791485e-09, "epoch": 19.813170241286862, "percentage": 99.07, "elapsed_time": "4:39:13", "remaining_time": "0:02:37", "throughput": 4091.36, "total_tokens": 68542840} +{"current_steps": 118250, "total_steps": 119360, "loss": 0.2347, "lr": 2.638924874224236e-09, "epoch": 19.81400804289544, "percentage": 99.07, "elapsed_time": "4:39:13", "remaining_time": "0:02:37", "throughput": 4091.38, "total_tokens": 68545944} +{"current_steps": 118255, "total_steps": 119360, "loss": 0.1936, "lr": 2.615227690186406e-09, "epoch": 19.81484584450402, "percentage": 99.07, "elapsed_time": "4:39:14", "remaining_time": "0:02:36", "throughput": 4091.38, "total_tokens": 68548792} +{"current_steps": 118260, "total_steps": 119360, "loss": 0.6835, "lr": 2.591637357470811e-09, "epoch": 19.8156836461126, "percentage": 99.08, "elapsed_time": "4:39:15", "remaining_time": "0:02:35", "throughput": 4091.39, "total_tokens": 68551640} +{"current_steps": 118265, "total_steps": 119360, "loss": 0.3275, "lr": 2.568153876582602e-09, "epoch": 19.81652144772118, "percentage": 99.08, "elapsed_time": "4:39:15", "remaining_time": "0:02:35", "throughput": 4091.4, "total_tokens": 68554360} +{"current_steps": 118270, "total_steps": 119360, "loss": 0.3287, "lr": 2.5447772480236e-09, "epoch": 19.81735924932976, "percentage": 99.09, "elapsed_time": "4:39:16", "remaining_time": "0:02:34", "throughput": 4091.41, "total_tokens": 68557336} +{"current_steps": 118275, "total_steps": 119360, "loss": 0.317, "lr": 2.5215074722939604e-09, "epoch": 19.818197050938338, "percentage": 99.09, "elapsed_time": "4:39:17", "remaining_time": "0:02:33", "throughput": 4091.42, "total_tokens": 68560184} +{"current_steps": 118280, "total_steps": 119360, "loss": 0.3871, "lr": 2.498344549891063e-09, "epoch": 19.819034852546917, "percentage": 99.1, "elapsed_time": "4:39:17", "remaining_time": "0:02:33", "throughput": 4091.42, "total_tokens": 68562840} +{"current_steps": 118285, "total_steps": 119360, "loss": 0.3392, "lr": 2.4752884813100674e-09, "epoch": 19.819872654155496, "percentage": 99.1, "elapsed_time": "4:39:18", "remaining_time": "0:02:32", "throughput": 4091.43, "total_tokens": 68565624} +{"current_steps": 118290, "total_steps": 119360, "loss": 0.506, "lr": 2.4523392670439126e-09, "epoch": 19.820710455764075, "percentage": 99.1, "elapsed_time": "4:39:19", "remaining_time": "0:02:31", "throughput": 4091.44, "total_tokens": 68568760} +{"current_steps": 118295, "total_steps": 119360, "loss": 0.3535, "lr": 2.4294969075838725e-09, "epoch": 19.821548257372655, "percentage": 99.11, "elapsed_time": "4:39:19", "remaining_time": "0:02:30", "throughput": 4091.45, "total_tokens": 68571832} +{"current_steps": 118300, "total_steps": 119360, "loss": 0.5638, "lr": 2.4067614034173347e-09, "epoch": 19.822386058981234, "percentage": 99.11, "elapsed_time": "4:39:20", "remaining_time": "0:02:30", "throughput": 4091.47, "total_tokens": 68575032} +{"current_steps": 118305, "total_steps": 119360, "loss": 0.2451, "lr": 2.3841327550311323e-09, "epoch": 19.823223860589813, "percentage": 99.12, "elapsed_time": "4:39:21", "remaining_time": "0:02:29", "throughput": 4091.47, "total_tokens": 68577816} +{"current_steps": 118310, "total_steps": 119360, "loss": 0.2658, "lr": 2.361610962909322e-09, "epoch": 19.824061662198392, "percentage": 99.12, "elapsed_time": "4:39:21", "remaining_time": "0:02:28", "throughput": 4091.48, "total_tokens": 68580696} +{"current_steps": 118315, "total_steps": 119360, "loss": 0.3021, "lr": 2.339196027532631e-09, "epoch": 19.82489946380697, "percentage": 99.12, "elapsed_time": "4:39:22", "remaining_time": "0:02:28", "throughput": 4091.49, "total_tokens": 68583608} +{"current_steps": 118320, "total_steps": 119360, "loss": 0.6268, "lr": 2.31688794938123e-09, "epoch": 19.82573726541555, "percentage": 99.13, "elapsed_time": "4:39:23", "remaining_time": "0:02:27", "throughput": 4091.5, "total_tokens": 68586808} +{"current_steps": 118325, "total_steps": 119360, "loss": 0.2652, "lr": 2.2946867289308506e-09, "epoch": 19.82657506702413, "percentage": 99.13, "elapsed_time": "4:39:23", "remaining_time": "0:02:26", "throughput": 4091.5, "total_tokens": 68589560} +{"current_steps": 118330, "total_steps": 119360, "loss": 0.1856, "lr": 2.2725923666577775e-09, "epoch": 19.827412868632706, "percentage": 99.14, "elapsed_time": "4:39:24", "remaining_time": "0:02:25", "throughput": 4091.52, "total_tokens": 68592856} +{"current_steps": 118335, "total_steps": 119360, "loss": 0.0914, "lr": 2.250604863033301e-09, "epoch": 19.828250670241285, "percentage": 99.14, "elapsed_time": "4:39:25", "remaining_time": "0:02:25", "throughput": 4091.52, "total_tokens": 68595704} +{"current_steps": 118340, "total_steps": 119360, "loss": 0.3739, "lr": 2.2287242185276002e-09, "epoch": 19.829088471849865, "percentage": 99.15, "elapsed_time": "4:39:26", "remaining_time": "0:02:24", "throughput": 4091.54, "total_tokens": 68598776} +{"current_steps": 118345, "total_steps": 119360, "loss": 0.645, "lr": 2.2069504336091898e-09, "epoch": 19.829926273458444, "percentage": 99.15, "elapsed_time": "4:39:26", "remaining_time": "0:02:23", "throughput": 4091.55, "total_tokens": 68601720} +{"current_steps": 118350, "total_steps": 119360, "loss": 0.4514, "lr": 2.1852835087426973e-09, "epoch": 19.830764075067023, "percentage": 99.15, "elapsed_time": "4:39:27", "remaining_time": "0:02:23", "throughput": 4091.55, "total_tokens": 68604408} +{"current_steps": 118355, "total_steps": 119360, "loss": 0.5045, "lr": 2.1637234443921964e-09, "epoch": 19.831601876675602, "percentage": 99.16, "elapsed_time": "4:39:27", "remaining_time": "0:02:22", "throughput": 4091.56, "total_tokens": 68607256} +{"current_steps": 118360, "total_steps": 119360, "loss": 0.1224, "lr": 2.1422702410184294e-09, "epoch": 19.83243967828418, "percentage": 99.16, "elapsed_time": "4:39:28", "remaining_time": "0:02:21", "throughput": 4091.56, "total_tokens": 68610008} +{"current_steps": 118365, "total_steps": 119360, "loss": 0.3262, "lr": 2.1209238990799185e-09, "epoch": 19.83327747989276, "percentage": 99.17, "elapsed_time": "4:39:29", "remaining_time": "0:02:20", "throughput": 4091.57, "total_tokens": 68612888} +{"current_steps": 118370, "total_steps": 119360, "loss": 0.3882, "lr": 2.0996844190335207e-09, "epoch": 19.83411528150134, "percentage": 99.17, "elapsed_time": "4:39:29", "remaining_time": "0:02:20", "throughput": 4091.59, "total_tokens": 68615800} +{"current_steps": 118375, "total_steps": 119360, "loss": 0.4437, "lr": 2.0785518013327623e-09, "epoch": 19.83495308310992, "percentage": 99.17, "elapsed_time": "4:39:30", "remaining_time": "0:02:19", "throughput": 4091.59, "total_tokens": 68618616} +{"current_steps": 118380, "total_steps": 119360, "loss": 0.4991, "lr": 2.0575260464295034e-09, "epoch": 19.8357908847185, "percentage": 99.18, "elapsed_time": "4:39:31", "remaining_time": "0:02:18", "throughput": 4091.6, "total_tokens": 68621432} +{"current_steps": 118385, "total_steps": 119360, "loss": 0.2274, "lr": 2.0366071547739397e-09, "epoch": 19.836628686327078, "percentage": 99.18, "elapsed_time": "4:39:31", "remaining_time": "0:02:18", "throughput": 4091.61, "total_tokens": 68624280} +{"current_steps": 118390, "total_steps": 119360, "loss": 0.4117, "lr": 2.015795126812936e-09, "epoch": 19.837466487935657, "percentage": 99.19, "elapsed_time": "4:39:32", "remaining_time": "0:02:17", "throughput": 4091.62, "total_tokens": 68627384} +{"current_steps": 118395, "total_steps": 119360, "loss": 0.3557, "lr": 1.995089962991692e-09, "epoch": 19.838304289544237, "percentage": 99.19, "elapsed_time": "4:39:33", "remaining_time": "0:02:16", "throughput": 4091.63, "total_tokens": 68630264} +{"current_steps": 118400, "total_steps": 119360, "loss": 0.1518, "lr": 1.974491663752076e-09, "epoch": 19.839142091152816, "percentage": 99.2, "elapsed_time": "4:39:34", "remaining_time": "0:02:16", "throughput": 4091.64, "total_tokens": 68633464} +{"current_steps": 118405, "total_steps": 119360, "loss": 0.3545, "lr": 1.954000229535957e-09, "epoch": 19.839979892761395, "percentage": 99.2, "elapsed_time": "4:39:34", "remaining_time": "0:02:15", "throughput": 4091.65, "total_tokens": 68636376} +{"current_steps": 118410, "total_steps": 119360, "loss": 0.3694, "lr": 1.9336156607802082e-09, "epoch": 19.840817694369974, "percentage": 99.2, "elapsed_time": "4:39:35", "remaining_time": "0:02:14", "throughput": 4091.66, "total_tokens": 68639096} +{"current_steps": 118415, "total_steps": 119360, "loss": 0.1884, "lr": 1.9133379579211466e-09, "epoch": 19.841655495978554, "percentage": 99.21, "elapsed_time": "4:39:36", "remaining_time": "0:02:13", "throughput": 4091.66, "total_tokens": 68641976} +{"current_steps": 118420, "total_steps": 119360, "loss": 0.245, "lr": 1.893167121392869e-09, "epoch": 19.842493297587133, "percentage": 99.21, "elapsed_time": "4:39:36", "remaining_time": "0:02:13", "throughput": 4091.67, "total_tokens": 68644888} +{"current_steps": 118425, "total_steps": 119360, "loss": 0.4594, "lr": 1.873103151625588e-09, "epoch": 19.843331099195712, "percentage": 99.22, "elapsed_time": "4:39:37", "remaining_time": "0:02:12", "throughput": 4091.68, "total_tokens": 68647608} +{"current_steps": 118430, "total_steps": 119360, "loss": 0.3177, "lr": 1.8531460490495146e-09, "epoch": 19.844168900804288, "percentage": 99.22, "elapsed_time": "4:39:38", "remaining_time": "0:02:11", "throughput": 4091.68, "total_tokens": 68650296} +{"current_steps": 118435, "total_steps": 119360, "loss": 0.1272, "lr": 1.833295814090419e-09, "epoch": 19.845006702412867, "percentage": 99.23, "elapsed_time": "4:39:38", "remaining_time": "0:02:11", "throughput": 4091.7, "total_tokens": 68653400} +{"current_steps": 118440, "total_steps": 119360, "loss": 0.3005, "lr": 1.8135524471729615e-09, "epoch": 19.845844504021446, "percentage": 99.23, "elapsed_time": "4:39:39", "remaining_time": "0:02:10", "throughput": 4091.7, "total_tokens": 68656088} +{"current_steps": 118445, "total_steps": 119360, "loss": 0.3484, "lr": 1.7939159487190272e-09, "epoch": 19.846682305630026, "percentage": 99.23, "elapsed_time": "4:39:40", "remaining_time": "0:02:09", "throughput": 4091.72, "total_tokens": 68659096} +{"current_steps": 118450, "total_steps": 119360, "loss": 0.1966, "lr": 1.7743863191493904e-09, "epoch": 19.847520107238605, "percentage": 99.24, "elapsed_time": "4:39:40", "remaining_time": "0:02:08", "throughput": 4091.73, "total_tokens": 68662488} +{"current_steps": 118455, "total_steps": 119360, "loss": 0.4325, "lr": 1.7549635588803848e-09, "epoch": 19.848357908847184, "percentage": 99.24, "elapsed_time": "4:39:41", "remaining_time": "0:02:08", "throughput": 4091.73, "total_tokens": 68665272} +{"current_steps": 118460, "total_steps": 119360, "loss": 0.2653, "lr": 1.7356476683283441e-09, "epoch": 19.849195710455763, "percentage": 99.25, "elapsed_time": "4:39:42", "remaining_time": "0:02:07", "throughput": 4091.74, "total_tokens": 68668152} +{"current_steps": 118465, "total_steps": 119360, "loss": 0.2658, "lr": 1.7164386479057161e-09, "epoch": 19.850033512064343, "percentage": 99.25, "elapsed_time": "4:39:42", "remaining_time": "0:02:06", "throughput": 4091.75, "total_tokens": 68670936} +{"current_steps": 118470, "total_steps": 119360, "loss": 0.2685, "lr": 1.6973364980232832e-09, "epoch": 19.850871313672922, "percentage": 99.25, "elapsed_time": "4:39:43", "remaining_time": "0:02:06", "throughput": 4091.76, "total_tokens": 68673976} +{"current_steps": 118475, "total_steps": 119360, "loss": 0.3722, "lr": 1.6783412190896076e-09, "epoch": 19.8517091152815, "percentage": 99.26, "elapsed_time": "4:39:44", "remaining_time": "0:02:05", "throughput": 4091.77, "total_tokens": 68676984} +{"current_steps": 118480, "total_steps": 119360, "loss": 0.4994, "lr": 1.6594528115110309e-09, "epoch": 19.85254691689008, "percentage": 99.26, "elapsed_time": "4:39:44", "remaining_time": "0:02:04", "throughput": 4091.77, "total_tokens": 68679736} +{"current_steps": 118485, "total_steps": 119360, "loss": 0.229, "lr": 1.6406712756911192e-09, "epoch": 19.85338471849866, "percentage": 99.27, "elapsed_time": "4:39:45", "remaining_time": "0:02:03", "throughput": 4091.79, "total_tokens": 68682744} +{"current_steps": 118490, "total_steps": 119360, "loss": 0.5198, "lr": 1.621996612031218e-09, "epoch": 19.85422252010724, "percentage": 99.27, "elapsed_time": "4:39:46", "remaining_time": "0:02:03", "throughput": 4091.79, "total_tokens": 68685528} +{"current_steps": 118495, "total_steps": 119360, "loss": 0.2938, "lr": 1.6034288209310077e-09, "epoch": 19.85506032171582, "percentage": 99.28, "elapsed_time": "4:39:46", "remaining_time": "0:02:02", "throughput": 4091.8, "total_tokens": 68688184} +{"current_steps": 118500, "total_steps": 119360, "loss": 0.3858, "lr": 1.5849679027873932e-09, "epoch": 19.855898123324398, "percentage": 99.28, "elapsed_time": "4:39:47", "remaining_time": "0:02:01", "throughput": 4091.81, "total_tokens": 68691032} +{"current_steps": 118505, "total_steps": 119360, "loss": 0.359, "lr": 1.5666138579950584e-09, "epoch": 19.856735924932977, "percentage": 99.28, "elapsed_time": "4:39:48", "remaining_time": "0:02:01", "throughput": 4091.82, "total_tokens": 68693752} +{"current_steps": 118510, "total_steps": 119360, "loss": 0.345, "lr": 1.5483666869464676e-09, "epoch": 19.857573726541556, "percentage": 99.29, "elapsed_time": "4:39:48", "remaining_time": "0:02:00", "throughput": 4091.83, "total_tokens": 68696664} +{"current_steps": 118515, "total_steps": 119360, "loss": 0.3649, "lr": 1.5302263900318637e-09, "epoch": 19.858411528150135, "percentage": 99.29, "elapsed_time": "4:39:49", "remaining_time": "0:01:59", "throughput": 4091.83, "total_tokens": 68699640} +{"current_steps": 118520, "total_steps": 119360, "loss": 0.2531, "lr": 1.5121929676392699e-09, "epoch": 19.859249329758715, "percentage": 99.3, "elapsed_time": "4:39:50", "remaining_time": "0:01:58", "throughput": 4091.84, "total_tokens": 68702392} +{"current_steps": 118525, "total_steps": 119360, "loss": 0.3652, "lr": 1.4942664201539336e-09, "epoch": 19.860087131367294, "percentage": 99.3, "elapsed_time": "4:39:50", "remaining_time": "0:01:58", "throughput": 4091.85, "total_tokens": 68705368} +{"current_steps": 118530, "total_steps": 119360, "loss": 0.391, "lr": 1.4764467479588818e-09, "epoch": 19.86092493297587, "percentage": 99.3, "elapsed_time": "4:39:51", "remaining_time": "0:01:57", "throughput": 4091.85, "total_tokens": 68708056} +{"current_steps": 118535, "total_steps": 119360, "loss": 0.193, "lr": 1.458733951435476e-09, "epoch": 19.86176273458445, "percentage": 99.31, "elapsed_time": "4:39:52", "remaining_time": "0:01:56", "throughput": 4091.87, "total_tokens": 68711128} +{"current_steps": 118540, "total_steps": 119360, "loss": 0.4031, "lr": 1.4411280309628573e-09, "epoch": 19.86260053619303, "percentage": 99.31, "elapsed_time": "4:39:52", "remaining_time": "0:01:56", "throughput": 4091.88, "total_tokens": 68713784} +{"current_steps": 118545, "total_steps": 119360, "loss": 0.2113, "lr": 1.4236289869168363e-09, "epoch": 19.863438337801608, "percentage": 99.32, "elapsed_time": "4:39:53", "remaining_time": "0:01:55", "throughput": 4091.88, "total_tokens": 68716632} +{"current_steps": 118550, "total_steps": 119360, "loss": 0.4692, "lr": 1.4062368196715582e-09, "epoch": 19.864276139410187, "percentage": 99.32, "elapsed_time": "4:39:54", "remaining_time": "0:01:54", "throughput": 4091.9, "total_tokens": 68719704} +{"current_steps": 118555, "total_steps": 119360, "loss": 0.5024, "lr": 1.3889515295989475e-09, "epoch": 19.865113941018766, "percentage": 99.33, "elapsed_time": "4:39:54", "remaining_time": "0:01:54", "throughput": 4091.9, "total_tokens": 68722456} +{"current_steps": 118560, "total_steps": 119360, "loss": 0.2917, "lr": 1.3717731170692639e-09, "epoch": 19.865951742627345, "percentage": 99.33, "elapsed_time": "4:39:55", "remaining_time": "0:01:53", "throughput": 4091.91, "total_tokens": 68725368} +{"current_steps": 118565, "total_steps": 119360, "loss": 0.3293, "lr": 1.3547015824494357e-09, "epoch": 19.866789544235925, "percentage": 99.33, "elapsed_time": "4:39:56", "remaining_time": "0:01:52", "throughput": 4091.92, "total_tokens": 68728024} +{"current_steps": 118570, "total_steps": 119360, "loss": 0.2257, "lr": 1.3377369261036165e-09, "epoch": 19.867627345844504, "percentage": 99.34, "elapsed_time": "4:39:56", "remaining_time": "0:01:51", "throughput": 4091.93, "total_tokens": 68731032} +{"current_steps": 118575, "total_steps": 119360, "loss": 0.3675, "lr": 1.3208791483959593e-09, "epoch": 19.868465147453083, "percentage": 99.34, "elapsed_time": "4:39:57", "remaining_time": "0:01:51", "throughput": 4091.93, "total_tokens": 68733976} +{"current_steps": 118580, "total_steps": 119360, "loss": 0.3496, "lr": 1.304128249685621e-09, "epoch": 19.869302949061662, "percentage": 99.35, "elapsed_time": "4:39:58", "remaining_time": "0:01:50", "throughput": 4091.94, "total_tokens": 68736696} +{"current_steps": 118585, "total_steps": 119360, "loss": 0.3774, "lr": 1.2874842303317592e-09, "epoch": 19.87014075067024, "percentage": 99.35, "elapsed_time": "4:39:58", "remaining_time": "0:01:49", "throughput": 4091.95, "total_tokens": 68739896} +{"current_steps": 118590, "total_steps": 119360, "loss": 0.3772, "lr": 1.2709470906896448e-09, "epoch": 19.87097855227882, "percentage": 99.35, "elapsed_time": "4:39:59", "remaining_time": "0:01:49", "throughput": 4091.96, "total_tokens": 68743064} +{"current_steps": 118595, "total_steps": 119360, "loss": 0.4135, "lr": 1.2545168311134391e-09, "epoch": 19.8718163538874, "percentage": 99.36, "elapsed_time": "4:40:00", "remaining_time": "0:01:48", "throughput": 4091.97, "total_tokens": 68746072} +{"current_steps": 118600, "total_steps": 119360, "loss": 0.2153, "lr": 1.238193451953973e-09, "epoch": 19.87265415549598, "percentage": 99.36, "elapsed_time": "4:40:01", "remaining_time": "0:01:47", "throughput": 4091.99, "total_tokens": 68749496} +{"current_steps": 118605, "total_steps": 119360, "loss": 0.2883, "lr": 1.2219769535598557e-09, "epoch": 19.87349195710456, "percentage": 99.37, "elapsed_time": "4:40:01", "remaining_time": "0:01:46", "throughput": 4091.99, "total_tokens": 68752248} +{"current_steps": 118610, "total_steps": 119360, "loss": 0.3131, "lr": 1.2058673362785877e-09, "epoch": 19.874329758713138, "percentage": 99.37, "elapsed_time": "4:40:02", "remaining_time": "0:01:46", "throughput": 4092.0, "total_tokens": 68754936} +{"current_steps": 118615, "total_steps": 119360, "loss": 0.3505, "lr": 1.189864600454338e-09, "epoch": 19.875167560321717, "percentage": 99.38, "elapsed_time": "4:40:03", "remaining_time": "0:01:45", "throughput": 4092.01, "total_tokens": 68758264} +{"current_steps": 118620, "total_steps": 119360, "loss": 0.2458, "lr": 1.1739687464296102e-09, "epoch": 19.876005361930297, "percentage": 99.38, "elapsed_time": "4:40:03", "remaining_time": "0:01:44", "throughput": 4092.02, "total_tokens": 68761112} +{"current_steps": 118625, "total_steps": 119360, "loss": 0.19, "lr": 1.1581797745435774e-09, "epoch": 19.876843163538872, "percentage": 99.38, "elapsed_time": "4:40:04", "remaining_time": "0:01:44", "throughput": 4092.03, "total_tokens": 68764024} +{"current_steps": 118630, "total_steps": 119360, "loss": 0.159, "lr": 1.1424976851343028e-09, "epoch": 19.87768096514745, "percentage": 99.39, "elapsed_time": "4:40:05", "remaining_time": "0:01:43", "throughput": 4092.04, "total_tokens": 68767000} +{"current_steps": 118635, "total_steps": 119360, "loss": 0.512, "lr": 1.1269224785370736e-09, "epoch": 19.87851876675603, "percentage": 99.39, "elapsed_time": "4:40:05", "remaining_time": "0:01:42", "throughput": 4092.05, "total_tokens": 68769976} +{"current_steps": 118640, "total_steps": 119360, "loss": 0.5003, "lr": 1.1114541550844015e-09, "epoch": 19.87935656836461, "percentage": 99.4, "elapsed_time": "4:40:06", "remaining_time": "0:01:41", "throughput": 4092.05, "total_tokens": 68772600} +{"current_steps": 118645, "total_steps": 119360, "loss": 0.4929, "lr": 1.0960927151082435e-09, "epoch": 19.88019436997319, "percentage": 99.4, "elapsed_time": "4:40:07", "remaining_time": "0:01:41", "throughput": 4092.06, "total_tokens": 68775288} +{"current_steps": 118650, "total_steps": 119360, "loss": 0.7018, "lr": 1.0808381589355598e-09, "epoch": 19.88103217158177, "percentage": 99.41, "elapsed_time": "4:40:07", "remaining_time": "0:01:40", "throughput": 4092.07, "total_tokens": 68778456} +{"current_steps": 118655, "total_steps": 119360, "loss": 0.2401, "lr": 1.0656904868933116e-09, "epoch": 19.881869973190348, "percentage": 99.41, "elapsed_time": "4:40:08", "remaining_time": "0:01:39", "throughput": 4092.08, "total_tokens": 68781688} +{"current_steps": 118660, "total_steps": 119360, "loss": 0.1458, "lr": 1.0506496993056836e-09, "epoch": 19.882707774798927, "percentage": 99.41, "elapsed_time": "4:40:09", "remaining_time": "0:01:39", "throughput": 4092.09, "total_tokens": 68784792} +{"current_steps": 118665, "total_steps": 119360, "loss": 0.625, "lr": 1.0357157964935304e-09, "epoch": 19.883545576407506, "percentage": 99.42, "elapsed_time": "4:40:09", "remaining_time": "0:01:38", "throughput": 4092.1, "total_tokens": 68788056} +{"current_steps": 118670, "total_steps": 119360, "loss": 0.4058, "lr": 1.0208887787760412e-09, "epoch": 19.884383378016086, "percentage": 99.42, "elapsed_time": "4:40:10", "remaining_time": "0:01:37", "throughput": 4092.11, "total_tokens": 68790808} +{"current_steps": 118675, "total_steps": 119360, "loss": 0.3595, "lr": 1.006168646471295e-09, "epoch": 19.885221179624665, "percentage": 99.43, "elapsed_time": "4:40:11", "remaining_time": "0:01:37", "throughput": 4092.11, "total_tokens": 68793432} +{"current_steps": 118680, "total_steps": 119360, "loss": 0.3782, "lr": 9.915553998934846e-10, "epoch": 19.886058981233244, "percentage": 99.43, "elapsed_time": "4:40:11", "remaining_time": "0:01:36", "throughput": 4092.11, "total_tokens": 68796248} +{"current_steps": 118685, "total_steps": 119360, "loss": 0.3587, "lr": 9.77049039354583e-10, "epoch": 19.886896782841823, "percentage": 99.43, "elapsed_time": "4:40:12", "remaining_time": "0:01:35", "throughput": 4092.13, "total_tokens": 68799352} +{"current_steps": 118690, "total_steps": 119360, "loss": 0.3212, "lr": 9.626495651654523e-10, "epoch": 19.887734584450403, "percentage": 99.44, "elapsed_time": "4:40:13", "remaining_time": "0:01:34", "throughput": 4092.13, "total_tokens": 68802040} +{"current_steps": 118695, "total_steps": 119360, "loss": 0.485, "lr": 9.483569776336243e-10, "epoch": 19.888572386058982, "percentage": 99.44, "elapsed_time": "4:40:13", "remaining_time": "0:01:34", "throughput": 4092.14, "total_tokens": 68804760} +{"current_steps": 118700, "total_steps": 119360, "loss": 0.5556, "lr": 9.341712770649657e-10, "epoch": 19.88941018766756, "percentage": 99.45, "elapsed_time": "4:40:14", "remaining_time": "0:01:33", "throughput": 4092.14, "total_tokens": 68807384} +{"current_steps": 118705, "total_steps": 119360, "loss": 0.4528, "lr": 9.200924637625675e-10, "epoch": 19.89024798927614, "percentage": 99.45, "elapsed_time": "4:40:15", "remaining_time": "0:01:32", "throughput": 4092.15, "total_tokens": 68810264} +{"current_steps": 118710, "total_steps": 119360, "loss": 0.1323, "lr": 9.061205380272998e-10, "epoch": 19.89108579088472, "percentage": 99.46, "elapsed_time": "4:40:15", "remaining_time": "0:01:32", "throughput": 4092.16, "total_tokens": 68813016} +{"current_steps": 118715, "total_steps": 119360, "loss": 0.338, "lr": 8.922555001578126e-10, "epoch": 19.8919235924933, "percentage": 99.46, "elapsed_time": "4:40:16", "remaining_time": "0:01:31", "throughput": 4092.17, "total_tokens": 68815960} +{"current_steps": 118720, "total_steps": 119360, "loss": 0.2945, "lr": 8.784973504510907e-10, "epoch": 19.89276139410188, "percentage": 99.46, "elapsed_time": "4:40:17", "remaining_time": "0:01:30", "throughput": 4092.17, "total_tokens": 68818648} +{"current_steps": 118725, "total_steps": 119360, "loss": 0.1681, "lr": 8.648460892013433e-10, "epoch": 19.893599195710454, "percentage": 99.47, "elapsed_time": "4:40:17", "remaining_time": "0:01:29", "throughput": 4092.18, "total_tokens": 68821560} +{"current_steps": 118730, "total_steps": 119360, "loss": 0.2018, "lr": 8.513017166994486e-10, "epoch": 19.894436997319033, "percentage": 99.47, "elapsed_time": "4:40:18", "remaining_time": "0:01:29", "throughput": 4092.19, "total_tokens": 68824536} +{"current_steps": 118735, "total_steps": 119360, "loss": 0.6018, "lr": 8.378642332362852e-10, "epoch": 19.895274798927613, "percentage": 99.48, "elapsed_time": "4:40:19", "remaining_time": "0:01:28", "throughput": 4092.2, "total_tokens": 68827448} +{"current_steps": 118740, "total_steps": 119360, "loss": 0.5027, "lr": 8.245336390982905e-10, "epoch": 19.896112600536192, "percentage": 99.48, "elapsed_time": "4:40:19", "remaining_time": "0:01:27", "throughput": 4092.22, "total_tokens": 68830904} +{"current_steps": 118745, "total_steps": 119360, "loss": 0.3139, "lr": 8.113099345713471e-10, "epoch": 19.89695040214477, "percentage": 99.48, "elapsed_time": "4:40:20", "remaining_time": "0:01:27", "throughput": 4092.22, "total_tokens": 68833624} +{"current_steps": 118750, "total_steps": 119360, "loss": 0.2413, "lr": 7.981931199368964e-10, "epoch": 19.89778820375335, "percentage": 99.49, "elapsed_time": "4:40:21", "remaining_time": "0:01:26", "throughput": 4092.24, "total_tokens": 68836664} +{"current_steps": 118755, "total_steps": 119360, "loss": 0.4301, "lr": 7.8518319547638e-10, "epoch": 19.89862600536193, "percentage": 99.49, "elapsed_time": "4:40:21", "remaining_time": "0:01:25", "throughput": 4092.25, "total_tokens": 68839544} +{"current_steps": 118760, "total_steps": 119360, "loss": 0.4396, "lr": 7.722801614679088e-10, "epoch": 19.89946380697051, "percentage": 99.5, "elapsed_time": "4:40:22", "remaining_time": "0:01:24", "throughput": 4092.26, "total_tokens": 68842584} +{"current_steps": 118765, "total_steps": 119360, "loss": 0.2955, "lr": 7.59484018187373e-10, "epoch": 19.90030160857909, "percentage": 99.5, "elapsed_time": "4:40:23", "remaining_time": "0:01:24", "throughput": 4092.27, "total_tokens": 68845464} +{"current_steps": 118770, "total_steps": 119360, "loss": 0.4421, "lr": 7.467947659073326e-10, "epoch": 19.901139410187668, "percentage": 99.51, "elapsed_time": "4:40:23", "remaining_time": "0:01:23", "throughput": 4092.28, "total_tokens": 68848312} +{"current_steps": 118775, "total_steps": 119360, "loss": 0.4442, "lr": 7.342124049009025e-10, "epoch": 19.901977211796247, "percentage": 99.51, "elapsed_time": "4:40:24", "remaining_time": "0:01:22", "throughput": 4092.29, "total_tokens": 68851384} +{"current_steps": 118780, "total_steps": 119360, "loss": 0.2643, "lr": 7.217369354356463e-10, "epoch": 19.902815013404826, "percentage": 99.51, "elapsed_time": "4:40:25", "remaining_time": "0:01:22", "throughput": 4092.29, "total_tokens": 68854008} +{"current_steps": 118785, "total_steps": 119360, "loss": 0.1953, "lr": 7.093683577791277e-10, "epoch": 19.903652815013405, "percentage": 99.52, "elapsed_time": "4:40:26", "remaining_time": "0:01:21", "throughput": 4092.31, "total_tokens": 68857304} +{"current_steps": 118790, "total_steps": 119360, "loss": 0.2412, "lr": 6.971066721950248e-10, "epoch": 19.904490616621985, "percentage": 99.52, "elapsed_time": "4:40:26", "remaining_time": "0:01:20", "throughput": 4092.32, "total_tokens": 68860152} +{"current_steps": 118795, "total_steps": 119360, "loss": 0.4519, "lr": 6.849518789464604e-10, "epoch": 19.905328418230564, "percentage": 99.53, "elapsed_time": "4:40:27", "remaining_time": "0:01:20", "throughput": 4092.33, "total_tokens": 68862904} +{"current_steps": 118800, "total_steps": 119360, "loss": 0.3965, "lr": 6.729039782926716e-10, "epoch": 19.906166219839143, "percentage": 99.53, "elapsed_time": "4:40:27", "remaining_time": "0:01:19", "throughput": 4092.33, "total_tokens": 68865624} +{"current_steps": 118805, "total_steps": 119360, "loss": 0.3022, "lr": 6.609629704912302e-10, "epoch": 19.907004021447722, "percentage": 99.54, "elapsed_time": "4:40:28", "remaining_time": "0:01:18", "throughput": 4092.34, "total_tokens": 68868600} +{"current_steps": 118810, "total_steps": 119360, "loss": 0.3187, "lr": 6.491288557980424e-10, "epoch": 19.9078418230563, "percentage": 99.54, "elapsed_time": "4:40:29", "remaining_time": "0:01:17", "throughput": 4092.35, "total_tokens": 68871512} +{"current_steps": 118815, "total_steps": 119360, "loss": 0.3089, "lr": 6.374016344656842e-10, "epoch": 19.90867962466488, "percentage": 99.54, "elapsed_time": "4:40:29", "remaining_time": "0:01:17", "throughput": 4092.36, "total_tokens": 68874328} +{"current_steps": 118820, "total_steps": 119360, "loss": 0.2804, "lr": 6.257813067450657e-10, "epoch": 19.90951742627346, "percentage": 99.55, "elapsed_time": "4:40:30", "remaining_time": "0:01:16", "throughput": 4092.37, "total_tokens": 68877656} +{"current_steps": 118825, "total_steps": 119360, "loss": 0.3372, "lr": 6.142678728843221e-10, "epoch": 19.910355227882036, "percentage": 99.55, "elapsed_time": "4:40:31", "remaining_time": "0:01:15", "throughput": 4092.39, "total_tokens": 68880536} +{"current_steps": 118830, "total_steps": 119360, "loss": 0.2262, "lr": 6.028613331299227e-10, "epoch": 19.911193029490615, "percentage": 99.56, "elapsed_time": "4:40:32", "remaining_time": "0:01:15", "throughput": 4092.4, "total_tokens": 68883672} +{"current_steps": 118835, "total_steps": 119360, "loss": 0.2412, "lr": 5.915616877255614e-10, "epoch": 19.912030831099194, "percentage": 99.56, "elapsed_time": "4:40:32", "remaining_time": "0:01:14", "throughput": 4092.4, "total_tokens": 68886296} +{"current_steps": 118840, "total_steps": 119360, "loss": 0.2198, "lr": 5.803689369127119e-10, "epoch": 19.912868632707774, "percentage": 99.56, "elapsed_time": "4:40:33", "remaining_time": "0:01:13", "throughput": 4092.4, "total_tokens": 68889016} +{"current_steps": 118845, "total_steps": 119360, "loss": 0.3127, "lr": 5.692830809317374e-10, "epoch": 19.913706434316353, "percentage": 99.57, "elapsed_time": "4:40:34", "remaining_time": "0:01:12", "throughput": 4092.4, "total_tokens": 68891672} +{"current_steps": 118850, "total_steps": 119360, "loss": 0.2246, "lr": 5.58304120018005e-10, "epoch": 19.914544235924932, "percentage": 99.57, "elapsed_time": "4:40:34", "remaining_time": "0:01:12", "throughput": 4092.41, "total_tokens": 68894616} +{"current_steps": 118855, "total_steps": 119360, "loss": 0.3134, "lr": 5.474320544079925e-10, "epoch": 19.91538203753351, "percentage": 99.58, "elapsed_time": "4:40:35", "remaining_time": "0:01:11", "throughput": 4092.41, "total_tokens": 68897336} +{"current_steps": 118860, "total_steps": 119360, "loss": 0.1659, "lr": 5.366668843326262e-10, "epoch": 19.91621983914209, "percentage": 99.58, "elapsed_time": "4:40:36", "remaining_time": "0:01:10", "throughput": 4092.42, "total_tokens": 68900152} +{"current_steps": 118865, "total_steps": 119360, "loss": 0.2341, "lr": 5.260086100233874e-10, "epoch": 19.91705764075067, "percentage": 99.59, "elapsed_time": "4:40:36", "remaining_time": "0:01:10", "throughput": 4092.42, "total_tokens": 68903032} +{"current_steps": 118870, "total_steps": 119360, "loss": 0.2685, "lr": 5.154572317067618e-10, "epoch": 19.91789544235925, "percentage": 99.59, "elapsed_time": "4:40:37", "remaining_time": "0:01:09", "throughput": 4092.43, "total_tokens": 68905816} +{"current_steps": 118875, "total_steps": 119360, "loss": 0.2149, "lr": 5.050127496097901e-10, "epoch": 19.91873324396783, "percentage": 99.59, "elapsed_time": "4:40:38", "remaining_time": "0:01:08", "throughput": 4092.44, "total_tokens": 68908504} +{"current_steps": 118880, "total_steps": 119360, "loss": 0.1926, "lr": 4.946751639550718e-10, "epoch": 19.919571045576408, "percentage": 99.6, "elapsed_time": "4:40:38", "remaining_time": "0:01:07", "throughput": 4092.45, "total_tokens": 68911800} +{"current_steps": 118885, "total_steps": 119360, "loss": 0.5696, "lr": 4.844444749635413e-10, "epoch": 19.920408847184987, "percentage": 99.6, "elapsed_time": "4:40:39", "remaining_time": "0:01:07", "throughput": 4092.46, "total_tokens": 68914744} +{"current_steps": 118890, "total_steps": 119360, "loss": 0.3046, "lr": 4.743206828539126e-10, "epoch": 19.921246648793566, "percentage": 99.61, "elapsed_time": "4:40:40", "remaining_time": "0:01:06", "throughput": 4092.46, "total_tokens": 68917432} +{"current_steps": 118895, "total_steps": 119360, "loss": 0.3364, "lr": 4.6430378784323436e-10, "epoch": 19.922084450402146, "percentage": 99.61, "elapsed_time": "4:40:40", "remaining_time": "0:01:05", "throughput": 4092.46, "total_tokens": 68920184} +{"current_steps": 118900, "total_steps": 119360, "loss": 0.2302, "lr": 4.5439379014466934e-10, "epoch": 19.922922252010725, "percentage": 99.61, "elapsed_time": "4:40:41", "remaining_time": "0:01:05", "throughput": 4092.48, "total_tokens": 68923224} +{"current_steps": 118905, "total_steps": 119360, "loss": 0.2652, "lr": 4.445906899713803e-10, "epoch": 19.923760053619304, "percentage": 99.62, "elapsed_time": "4:40:42", "remaining_time": "0:01:04", "throughput": 4092.5, "total_tokens": 68926392} +{"current_steps": 118910, "total_steps": 119360, "loss": 0.3016, "lr": 4.348944875320893e-10, "epoch": 19.924597855227884, "percentage": 99.62, "elapsed_time": "4:40:42", "remaining_time": "0:01:03", "throughput": 4092.51, "total_tokens": 68929272} +{"current_steps": 118915, "total_steps": 119360, "loss": 0.3851, "lr": 4.2530518303440794e-10, "epoch": 19.925435656836463, "percentage": 99.63, "elapsed_time": "4:40:43", "remaining_time": "0:01:03", "throughput": 4092.51, "total_tokens": 68932120} +{"current_steps": 118920, "total_steps": 119360, "loss": 0.2251, "lr": 4.158227766831724e-10, "epoch": 19.92627345844504, "percentage": 99.63, "elapsed_time": "4:40:44", "remaining_time": "0:01:02", "throughput": 4092.52, "total_tokens": 68935032} +{"current_steps": 118925, "total_steps": 119360, "loss": 0.6523, "lr": 4.064472686809984e-10, "epoch": 19.927111260053618, "percentage": 99.64, "elapsed_time": "4:40:44", "remaining_time": "0:01:01", "throughput": 4092.52, "total_tokens": 68937752} +{"current_steps": 118930, "total_steps": 119360, "loss": 0.3038, "lr": 3.9717865922883626e-10, "epoch": 19.927949061662197, "percentage": 99.64, "elapsed_time": "4:40:45", "remaining_time": "0:01:00", "throughput": 4092.53, "total_tokens": 68940600} +{"current_steps": 118935, "total_steps": 119360, "loss": 0.407, "lr": 3.880169485248608e-10, "epoch": 19.928786863270776, "percentage": 99.64, "elapsed_time": "4:40:46", "remaining_time": "0:01:00", "throughput": 4092.54, "total_tokens": 68943320} +{"current_steps": 118940, "total_steps": 119360, "loss": 0.5561, "lr": 3.7896213676447137e-10, "epoch": 19.929624664879356, "percentage": 99.65, "elapsed_time": "4:40:46", "remaining_time": "0:00:59", "throughput": 4092.55, "total_tokens": 68946328} +{"current_steps": 118945, "total_steps": 119360, "loss": 0.2773, "lr": 3.700142241414018e-10, "epoch": 19.930462466487935, "percentage": 99.65, "elapsed_time": "4:40:47", "remaining_time": "0:00:58", "throughput": 4092.56, "total_tokens": 68949176} +{"current_steps": 118950, "total_steps": 119360, "loss": 0.1465, "lr": 3.6117321084772063e-10, "epoch": 19.931300268096514, "percentage": 99.66, "elapsed_time": "4:40:48", "remaining_time": "0:00:58", "throughput": 4092.57, "total_tokens": 68952184} +{"current_steps": 118955, "total_steps": 119360, "loss": 0.3786, "lr": 3.5243909707161075e-10, "epoch": 19.932138069705093, "percentage": 99.66, "elapsed_time": "4:40:48", "remaining_time": "0:00:57", "throughput": 4092.57, "total_tokens": 68954840} +{"current_steps": 118960, "total_steps": 119360, "loss": 0.2403, "lr": 3.4381188299958957e-10, "epoch": 19.932975871313673, "percentage": 99.66, "elapsed_time": "4:40:49", "remaining_time": "0:00:56", "throughput": 4092.59, "total_tokens": 68957880} +{"current_steps": 118965, "total_steps": 119360, "loss": 0.2911, "lr": 3.3529156881706436e-10, "epoch": 19.933813672922252, "percentage": 99.67, "elapsed_time": "4:40:50", "remaining_time": "0:00:55", "throughput": 4092.59, "total_tokens": 68960696} +{"current_steps": 118970, "total_steps": 119360, "loss": 0.2358, "lr": 3.268781547055566e-10, "epoch": 19.93465147453083, "percentage": 99.67, "elapsed_time": "4:40:50", "remaining_time": "0:00:55", "throughput": 4092.59, "total_tokens": 68963416} +{"current_steps": 118975, "total_steps": 119360, "loss": 0.1573, "lr": 3.1857164084492243e-10, "epoch": 19.93548927613941, "percentage": 99.68, "elapsed_time": "4:40:51", "remaining_time": "0:00:54", "throughput": 4092.6, "total_tokens": 68966168} +{"current_steps": 118980, "total_steps": 119360, "loss": 0.4959, "lr": 3.103720274133526e-10, "epoch": 19.93632707774799, "percentage": 99.68, "elapsed_time": "4:40:52", "remaining_time": "0:00:53", "throughput": 4092.61, "total_tokens": 68968888} +{"current_steps": 118985, "total_steps": 119360, "loss": 0.1991, "lr": 3.022793145857073e-10, "epoch": 19.93716487935657, "percentage": 99.69, "elapsed_time": "4:40:52", "remaining_time": "0:00:53", "throughput": 4092.61, "total_tokens": 68971864} +{"current_steps": 118990, "total_steps": 119360, "loss": 0.3011, "lr": 2.942935025351812e-10, "epoch": 19.93800268096515, "percentage": 99.69, "elapsed_time": "4:40:53", "remaining_time": "0:00:52", "throughput": 4092.62, "total_tokens": 68974776} +{"current_steps": 118995, "total_steps": 119360, "loss": 0.2692, "lr": 2.864145914321936e-10, "epoch": 19.938840482573728, "percentage": 99.69, "elapsed_time": "4:40:54", "remaining_time": "0:00:51", "throughput": 4092.63, "total_tokens": 68977816} +{"current_steps": 119000, "total_steps": 119360, "loss": 0.2675, "lr": 2.786425814454985e-10, "epoch": 19.939678284182307, "percentage": 99.7, "elapsed_time": "4:40:54", "remaining_time": "0:00:50", "throughput": 4092.64, "total_tokens": 68980760} +{"current_steps": 119005, "total_steps": 119360, "loss": 0.6189, "lr": 2.709774727416292e-10, "epoch": 19.940516085790886, "percentage": 99.7, "elapsed_time": "4:40:55", "remaining_time": "0:00:50", "throughput": 4092.65, "total_tokens": 68983800} +{"current_steps": 119010, "total_steps": 119360, "loss": 0.6796, "lr": 2.634192654837886e-10, "epoch": 19.941353887399465, "percentage": 99.71, "elapsed_time": "4:40:56", "remaining_time": "0:00:49", "throughput": 4092.66, "total_tokens": 68986488} +{"current_steps": 119015, "total_steps": 119360, "loss": 0.3424, "lr": 2.559679598340692e-10, "epoch": 19.94219168900804, "percentage": 99.71, "elapsed_time": "4:40:56", "remaining_time": "0:00:48", "throughput": 4092.67, "total_tokens": 68989560} +{"current_steps": 119020, "total_steps": 119360, "loss": 0.252, "lr": 2.4862355595123287e-10, "epoch": 19.94302949061662, "percentage": 99.72, "elapsed_time": "4:40:57", "remaining_time": "0:00:48", "throughput": 4092.68, "total_tokens": 68992600} +{"current_steps": 119025, "total_steps": 119360, "loss": 0.2994, "lr": 2.4138605399293137e-10, "epoch": 19.9438672922252, "percentage": 99.72, "elapsed_time": "4:40:58", "remaining_time": "0:00:47", "throughput": 4092.69, "total_tokens": 68995544} +{"current_steps": 119030, "total_steps": 119360, "loss": 0.2563, "lr": 2.342554541134856e-10, "epoch": 19.94470509383378, "percentage": 99.72, "elapsed_time": "4:40:58", "remaining_time": "0:00:46", "throughput": 4092.7, "total_tokens": 68998456} +{"current_steps": 119035, "total_steps": 119360, "loss": 0.4362, "lr": 2.272317564655513e-10, "epoch": 19.945542895442358, "percentage": 99.73, "elapsed_time": "4:40:59", "remaining_time": "0:00:46", "throughput": 4092.71, "total_tokens": 69001368} +{"current_steps": 119040, "total_steps": 119360, "loss": 0.0955, "lr": 2.2031496119956363e-10, "epoch": 19.946380697050937, "percentage": 99.73, "elapsed_time": "4:41:00", "remaining_time": "0:00:45", "throughput": 4092.71, "total_tokens": 69004056} +{"current_steps": 119045, "total_steps": 119360, "loss": 0.2207, "lr": 2.135050684631823e-10, "epoch": 19.947218498659517, "percentage": 99.74, "elapsed_time": "4:41:00", "remaining_time": "0:00:44", "throughput": 4092.72, "total_tokens": 69007288} +{"current_steps": 119050, "total_steps": 119360, "loss": 0.4191, "lr": 2.068020784012914e-10, "epoch": 19.948056300268096, "percentage": 99.74, "elapsed_time": "4:41:01", "remaining_time": "0:00:43", "throughput": 4092.73, "total_tokens": 69010040} +{"current_steps": 119055, "total_steps": 119360, "loss": 0.3012, "lr": 2.0020599115877504e-10, "epoch": 19.948894101876675, "percentage": 99.74, "elapsed_time": "4:41:02", "remaining_time": "0:00:43", "throughput": 4092.74, "total_tokens": 69013080} +{"current_steps": 119060, "total_steps": 119360, "loss": 0.2944, "lr": 1.937168068749662e-10, "epoch": 19.949731903485254, "percentage": 99.75, "elapsed_time": "4:41:03", "remaining_time": "0:00:42", "throughput": 4092.74, "total_tokens": 69016024} +{"current_steps": 119065, "total_steps": 119360, "loss": 0.3105, "lr": 1.8733452569030808e-10, "epoch": 19.950569705093834, "percentage": 99.75, "elapsed_time": "4:41:03", "remaining_time": "0:00:41", "throughput": 4092.76, "total_tokens": 69018904} +{"current_steps": 119070, "total_steps": 119360, "loss": 0.1909, "lr": 1.810591477396928e-10, "epoch": 19.951407506702413, "percentage": 99.76, "elapsed_time": "4:41:04", "remaining_time": "0:00:41", "throughput": 4092.76, "total_tokens": 69021624} +{"current_steps": 119075, "total_steps": 119360, "loss": 0.6214, "lr": 1.7489067315801246e-10, "epoch": 19.952245308310992, "percentage": 99.76, "elapsed_time": "4:41:05", "remaining_time": "0:00:40", "throughput": 4092.78, "total_tokens": 69024824} +{"current_steps": 119080, "total_steps": 119360, "loss": 0.2799, "lr": 1.6882910207738356e-10, "epoch": 19.95308310991957, "percentage": 99.77, "elapsed_time": "4:41:05", "remaining_time": "0:00:39", "throughput": 4092.79, "total_tokens": 69027928} +{"current_steps": 119085, "total_steps": 119360, "loss": 0.5445, "lr": 1.6287443462714713e-10, "epoch": 19.95392091152815, "percentage": 99.77, "elapsed_time": "4:41:06", "remaining_time": "0:00:38", "throughput": 4092.79, "total_tokens": 69030648} +{"current_steps": 119090, "total_steps": 119360, "loss": 0.257, "lr": 1.570266709344237e-10, "epoch": 19.95475871313673, "percentage": 99.77, "elapsed_time": "4:41:07", "remaining_time": "0:00:38", "throughput": 4092.8, "total_tokens": 69033592} +{"current_steps": 119095, "total_steps": 119360, "loss": 0.3007, "lr": 1.5128581112466844e-10, "epoch": 19.95559651474531, "percentage": 99.78, "elapsed_time": "4:41:07", "remaining_time": "0:00:37", "throughput": 4092.8, "total_tokens": 69036568} +{"current_steps": 119100, "total_steps": 119360, "loss": 0.353, "lr": 1.4565185532056103e-10, "epoch": 19.95643431635389, "percentage": 99.78, "elapsed_time": "4:41:08", "remaining_time": "0:00:36", "throughput": 4092.81, "total_tokens": 69039448} +{"current_steps": 119105, "total_steps": 119360, "loss": 0.4566, "lr": 1.4012480364200555e-10, "epoch": 19.957272117962468, "percentage": 99.79, "elapsed_time": "4:41:09", "remaining_time": "0:00:36", "throughput": 4092.81, "total_tokens": 69042232} +{"current_steps": 119110, "total_steps": 119360, "loss": 0.224, "lr": 1.3470465620779582e-10, "epoch": 19.958109919571047, "percentage": 99.79, "elapsed_time": "4:41:09", "remaining_time": "0:00:35", "throughput": 4092.83, "total_tokens": 69045304} +{"current_steps": 119115, "total_steps": 119360, "loss": 0.4068, "lr": 1.293914131339502e-10, "epoch": 19.958947721179626, "percentage": 99.79, "elapsed_time": "4:41:10", "remaining_time": "0:00:34", "throughput": 4092.84, "total_tokens": 69048344} +{"current_steps": 119120, "total_steps": 119360, "loss": 0.2249, "lr": 1.2418507453315632e-10, "epoch": 19.959785522788202, "percentage": 99.8, "elapsed_time": "4:41:11", "remaining_time": "0:00:33", "throughput": 4092.84, "total_tokens": 69051032} +{"current_steps": 119125, "total_steps": 119360, "loss": 0.4014, "lr": 1.1908564051754668e-10, "epoch": 19.96062332439678, "percentage": 99.8, "elapsed_time": "4:41:11", "remaining_time": "0:00:33", "throughput": 4092.85, "total_tokens": 69053944} +{"current_steps": 119130, "total_steps": 119360, "loss": 0.3188, "lr": 1.1409311119592314e-10, "epoch": 19.96146112600536, "percentage": 99.81, "elapsed_time": "4:41:12", "remaining_time": "0:00:32", "throughput": 4092.86, "total_tokens": 69056984} +{"current_steps": 119135, "total_steps": 119360, "loss": 0.3815, "lr": 1.0920748667542224e-10, "epoch": 19.96229892761394, "percentage": 99.81, "elapsed_time": "4:41:13", "remaining_time": "0:00:31", "throughput": 4092.87, "total_tokens": 69059928} +{"current_steps": 119140, "total_steps": 119360, "loss": 0.3275, "lr": 1.0442876705984984e-10, "epoch": 19.96313672922252, "percentage": 99.82, "elapsed_time": "4:41:13", "remaining_time": "0:00:31", "throughput": 4092.87, "total_tokens": 69062616} +{"current_steps": 119145, "total_steps": 119360, "loss": 0.5144, "lr": 9.975695245134642e-11, "epoch": 19.9639745308311, "percentage": 99.82, "elapsed_time": "4:41:14", "remaining_time": "0:00:30", "throughput": 4092.87, "total_tokens": 69065432} +{"current_steps": 119150, "total_steps": 119360, "loss": 0.4981, "lr": 9.51920429503872e-11, "epoch": 19.964812332439678, "percentage": 99.82, "elapsed_time": "4:41:15", "remaining_time": "0:00:29", "throughput": 4092.88, "total_tokens": 69068312} +{"current_steps": 119155, "total_steps": 119360, "loss": 0.2633, "lr": 9.073403865411667e-11, "epoch": 19.965650134048257, "percentage": 99.83, "elapsed_time": "4:41:15", "remaining_time": "0:00:29", "throughput": 4092.89, "total_tokens": 69071224} +{"current_steps": 119160, "total_steps": 119360, "loss": 0.2487, "lr": 8.638293965856914e-11, "epoch": 19.966487935656836, "percentage": 99.83, "elapsed_time": "4:41:16", "remaining_time": "0:00:28", "throughput": 4092.91, "total_tokens": 69074328} +{"current_steps": 119165, "total_steps": 119360, "loss": 0.1152, "lr": 8.213874605589311e-11, "epoch": 19.967325737265416, "percentage": 99.84, "elapsed_time": "4:41:17", "remaining_time": "0:00:27", "throughput": 4092.92, "total_tokens": 69077112} +{"current_steps": 119170, "total_steps": 119360, "loss": 0.1801, "lr": 7.800145793712688e-11, "epoch": 19.968163538873995, "percentage": 99.84, "elapsed_time": "4:41:17", "remaining_time": "0:00:26", "throughput": 4092.92, "total_tokens": 69079960} +{"current_steps": 119175, "total_steps": 119360, "loss": 0.2107, "lr": 7.397107539053316e-11, "epoch": 19.969001340482574, "percentage": 99.85, "elapsed_time": "4:41:18", "remaining_time": "0:00:26", "throughput": 4092.94, "total_tokens": 69082968} +{"current_steps": 119180, "total_steps": 119360, "loss": 0.3554, "lr": 7.004759850326448e-11, "epoch": 19.969839142091153, "percentage": 99.85, "elapsed_time": "4:41:19", "remaining_time": "0:00:25", "throughput": 4092.94, "total_tokens": 69085592} +{"current_steps": 119185, "total_steps": 119360, "loss": 0.2006, "lr": 6.623102735803244e-11, "epoch": 19.970676943699733, "percentage": 99.85, "elapsed_time": "4:41:19", "remaining_time": "0:00:24", "throughput": 4092.95, "total_tokens": 69088696} +{"current_steps": 119190, "total_steps": 119360, "loss": 0.5264, "lr": 6.252136203699355e-11, "epoch": 19.971514745308312, "percentage": 99.86, "elapsed_time": "4:41:20", "remaining_time": "0:00:24", "throughput": 4092.97, "total_tokens": 69091864} +{"current_steps": 119195, "total_steps": 119360, "loss": 0.557, "lr": 5.891860261897364e-11, "epoch": 19.97235254691689, "percentage": 99.86, "elapsed_time": "4:41:21", "remaining_time": "0:00:23", "throughput": 4092.98, "total_tokens": 69094936} +{"current_steps": 119200, "total_steps": 119360, "loss": 0.5124, "lr": 5.5422749181688326e-11, "epoch": 19.97319034852547, "percentage": 99.87, "elapsed_time": "4:41:22", "remaining_time": "0:00:22", "throughput": 4093.0, "total_tokens": 69098552} +{"current_steps": 119205, "total_steps": 119360, "loss": 0.1176, "lr": 5.203380180007767e-11, "epoch": 19.97402815013405, "percentage": 99.87, "elapsed_time": "4:41:22", "remaining_time": "0:00:21", "throughput": 4093.01, "total_tokens": 69101528} +{"current_steps": 119210, "total_steps": 119360, "loss": 0.286, "lr": 4.8751760545751035e-11, "epoch": 19.97486595174263, "percentage": 99.87, "elapsed_time": "4:41:23", "remaining_time": "0:00:21", "throughput": 4093.03, "total_tokens": 69104792} +{"current_steps": 119215, "total_steps": 119360, "loss": 0.2809, "lr": 4.5576625489207606e-11, "epoch": 19.975703753351205, "percentage": 99.88, "elapsed_time": "4:41:24", "remaining_time": "0:00:20", "throughput": 4093.04, "total_tokens": 69107576} +{"current_steps": 119220, "total_steps": 119360, "loss": 0.4476, "lr": 4.2508396698170973e-11, "epoch": 19.976541554959784, "percentage": 99.88, "elapsed_time": "4:41:24", "remaining_time": "0:00:19", "throughput": 4093.04, "total_tokens": 69110456} +{"current_steps": 119225, "total_steps": 119360, "loss": 0.2164, "lr": 3.954707423869941e-11, "epoch": 19.977379356568363, "percentage": 99.89, "elapsed_time": "4:41:25", "remaining_time": "0:00:19", "throughput": 4093.04, "total_tokens": 69113176} +{"current_steps": 119230, "total_steps": 119360, "loss": 0.4417, "lr": 3.669265817407564e-11, "epoch": 19.978217158176943, "percentage": 99.89, "elapsed_time": "4:41:26", "remaining_time": "0:00:18", "throughput": 4093.06, "total_tokens": 69116088} +{"current_steps": 119235, "total_steps": 119360, "loss": 0.1217, "lr": 3.3945148564806794e-11, "epoch": 19.979054959785522, "percentage": 99.9, "elapsed_time": "4:41:26", "remaining_time": "0:00:17", "throughput": 4093.07, "total_tokens": 69118968} +{"current_steps": 119240, "total_steps": 119360, "loss": 0.3273, "lr": 3.1304545469734716e-11, "epoch": 19.9798927613941, "percentage": 99.9, "elapsed_time": "4:41:27", "remaining_time": "0:00:16", "throughput": 4093.08, "total_tokens": 69122008} +{"current_steps": 119245, "total_steps": 119360, "loss": 0.3353, "lr": 2.8770848946035878e-11, "epoch": 19.98073056300268, "percentage": 99.9, "elapsed_time": "4:41:28", "remaining_time": "0:00:16", "throughput": 4093.09, "total_tokens": 69125048} +{"current_steps": 119250, "total_steps": 119360, "loss": 0.1693, "lr": 2.6344059047556103e-11, "epoch": 19.98156836461126, "percentage": 99.91, "elapsed_time": "4:41:28", "remaining_time": "0:00:15", "throughput": 4093.1, "total_tokens": 69128088} +{"current_steps": 119255, "total_steps": 119360, "loss": 0.2716, "lr": 2.4024175825365647e-11, "epoch": 19.98240616621984, "percentage": 99.91, "elapsed_time": "4:41:29", "remaining_time": "0:00:14", "throughput": 4093.11, "total_tokens": 69131032} +{"current_steps": 119260, "total_steps": 119360, "loss": 0.4149, "lr": 2.181119932997966e-11, "epoch": 19.983243967828418, "percentage": 99.92, "elapsed_time": "4:41:30", "remaining_time": "0:00:14", "throughput": 4093.12, "total_tokens": 69134104} +{"current_steps": 119265, "total_steps": 119360, "loss": 0.3103, "lr": 1.9705129608582618e-11, "epoch": 19.984081769436997, "percentage": 99.92, "elapsed_time": "4:41:30", "remaining_time": "0:00:13", "throughput": 4093.12, "total_tokens": 69136856} +{"current_steps": 119270, "total_steps": 119360, "loss": 0.4018, "lr": 1.7705966706138557e-11, "epoch": 19.984919571045577, "percentage": 99.92, "elapsed_time": "4:41:31", "remaining_time": "0:00:12", "throughput": 4093.14, "total_tokens": 69139832} +{"current_steps": 119275, "total_steps": 119360, "loss": 0.2237, "lr": 1.581371066539106e-11, "epoch": 19.985757372654156, "percentage": 99.93, "elapsed_time": "4:41:32", "remaining_time": "0:00:12", "throughput": 4093.14, "total_tokens": 69142616} +{"current_steps": 119280, "total_steps": 119360, "loss": 0.4371, "lr": 1.4028361526308155e-11, "epoch": 19.986595174262735, "percentage": 99.93, "elapsed_time": "4:41:32", "remaining_time": "0:00:11", "throughput": 4093.14, "total_tokens": 69145272} +{"current_steps": 119285, "total_steps": 119360, "loss": 0.5699, "lr": 1.2349919327747651e-11, "epoch": 19.987432975871315, "percentage": 99.94, "elapsed_time": "4:41:33", "remaining_time": "0:00:10", "throughput": 4093.15, "total_tokens": 69148344} +{"current_steps": 119290, "total_steps": 119360, "loss": 0.6418, "lr": 1.0778384105236683e-11, "epoch": 19.988270777479894, "percentage": 99.94, "elapsed_time": "4:41:34", "remaining_time": "0:00:09", "throughput": 4093.16, "total_tokens": 69150936} +{"current_steps": 119295, "total_steps": 119360, "loss": 0.1985, "lr": 9.313755892637055e-12, "epoch": 19.989108579088473, "percentage": 99.95, "elapsed_time": "4:41:34", "remaining_time": "0:00:09", "throughput": 4093.17, "total_tokens": 69153784} +{"current_steps": 119300, "total_steps": 119360, "loss": 0.203, "lr": 7.95603472103501e-12, "epoch": 19.989946380697052, "percentage": 99.95, "elapsed_time": "4:41:35", "remaining_time": "0:00:08", "throughput": 4093.17, "total_tokens": 69156600} +{"current_steps": 119305, "total_steps": 119360, "loss": 0.2808, "lr": 6.7052206198514606e-12, "epoch": 19.99078418230563, "percentage": 99.95, "elapsed_time": "4:41:36", "remaining_time": "0:00:07", "throughput": 4093.19, "total_tokens": 69159736} +{"current_steps": 119310, "total_steps": 119360, "loss": 0.165, "lr": 5.561313615176644e-12, "epoch": 19.991621983914207, "percentage": 99.96, "elapsed_time": "4:41:37", "remaining_time": "0:00:07", "throughput": 4093.2, "total_tokens": 69162808} +{"current_steps": 119315, "total_steps": 119360, "loss": 0.3076, "lr": 4.52431373143547e-12, "epoch": 19.992459785522787, "percentage": 99.96, "elapsed_time": "4:41:37", "remaining_time": "0:00:06", "throughput": 4093.2, "total_tokens": 69165624} +{"current_steps": 119320, "total_steps": 119360, "loss": 0.4274, "lr": 3.594220991942621e-12, "epoch": 19.993297587131366, "percentage": 99.97, "elapsed_time": "4:41:38", "remaining_time": "0:00:05", "throughput": 4093.21, "total_tokens": 69168664} +{"current_steps": 119325, "total_steps": 119360, "loss": 0.3873, "lr": 2.7710354155718875e-12, "epoch": 19.994135388739945, "percentage": 99.97, "elapsed_time": "4:41:39", "remaining_time": "0:00:04", "throughput": 4093.21, "total_tokens": 69171448} +{"current_steps": 119330, "total_steps": 119360, "loss": 0.3688, "lr": 2.0547570200868395e-12, "epoch": 19.994973190348524, "percentage": 99.97, "elapsed_time": "4:41:39", "remaining_time": "0:00:04", "throughput": 4093.23, "total_tokens": 69174680} +{"current_steps": 119335, "total_steps": 119360, "loss": 0.1076, "lr": 1.4453858204754866e-12, "epoch": 19.995810991957104, "percentage": 99.98, "elapsed_time": "4:41:40", "remaining_time": "0:00:03", "throughput": 4093.24, "total_tokens": 69177816} +{"current_steps": 119340, "total_steps": 119360, "loss": 0.3217, "lr": 9.429218306156173e-13, "epoch": 19.996648793565683, "percentage": 99.98, "elapsed_time": "4:41:41", "remaining_time": "0:00:02", "throughput": 4093.25, "total_tokens": 69180632} +{"current_steps": 119345, "total_steps": 119360, "loss": 0.3804, "lr": 5.473650610543502e-13, "epoch": 19.997486595174262, "percentage": 99.99, "elapsed_time": "4:41:41", "remaining_time": "0:00:02", "throughput": 4093.26, "total_tokens": 69183480} +{"current_steps": 119350, "total_steps": 119360, "loss": 0.4557, "lr": 2.5871551956324624e-13, "epoch": 19.99832439678284, "percentage": 99.99, "elapsed_time": "4:41:42", "remaining_time": "0:00:01", "throughput": 4093.27, "total_tokens": 69186328} +{"current_steps": 119355, "total_steps": 119360, "loss": 0.3563, "lr": 7.697321280364378e-14, "epoch": 19.99916219839142, "percentage": 100.0, "elapsed_time": "4:41:43", "remaining_time": "0:00:00", "throughput": 4093.28, "total_tokens": 69189240} +{"current_steps": 119360, "total_steps": 119360, "loss": 0.2774, "lr": 2.1381446613233382e-15, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "4:41:43", "remaining_time": "0:00:00", "throughput": 4093.26, "total_tokens": 69191680} +{"current_steps": 119360, "total_steps": 119360, "eval_loss": 1.499447226524353, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "4:43:13", "remaining_time": "0:00:00", "throughput": 4071.63, "total_tokens": 69191680} +{"current_steps": 119360, "total_steps": 119360, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "4:43:15", "remaining_time": "0:00:00", "throughput": 4071.2, "total_tokens": 69191680}