diff --git "a/trainer_log.jsonl" "b/trainer_log.jsonl" --- "a/trainer_log.jsonl" +++ "b/trainer_log.jsonl" @@ -6118,3 +6118,678 @@ {"current_steps": 30545, "total_steps": 33920, "loss": 0.3001, "lr": 2.9872752215055755e-07, "epoch": 18.01002358490566, "percentage": 90.05, "elapsed_time": "0:59:18", "remaining_time": "0:06:33", "throughput": 5651.52, "total_tokens": 20108160} {"current_steps": 30550, "total_steps": 33920, "loss": 0.3134, "lr": 2.9785220627555844e-07, "epoch": 18.01297169811321, "percentage": 90.06, "elapsed_time": "0:59:18", "remaining_time": "0:06:32", "throughput": 5651.64, "total_tokens": 20112736} {"current_steps": 30555, "total_steps": 33920, "loss": 0.3682, "lr": 2.9697813531445295e-07, "epoch": 18.015919811320753, "percentage": 90.08, "elapsed_time": "0:59:19", "remaining_time": "0:06:31", "throughput": 5651.57, "total_tokens": 20115840} +{"current_steps": 30560, "total_steps": 33920, "loss": 0.2745, "lr": 2.9610530949865433e-07, "epoch": 18.0188679245283, "percentage": 90.09, "elapsed_time": "0:59:19", "remaining_time": "0:06:31", "throughput": 5651.58, "total_tokens": 20119200} +{"current_steps": 30565, "total_steps": 33920, "loss": 0.3283, "lr": 2.952337290592483e-07, "epoch": 18.02181603773585, "percentage": 90.11, "elapsed_time": "0:59:20", "remaining_time": "0:06:30", "throughput": 5651.67, "total_tokens": 20122720} +{"current_steps": 30570, "total_steps": 33920, "loss": 0.266, "lr": 2.9436339422698913e-07, "epoch": 18.024764150943398, "percentage": 90.12, "elapsed_time": "0:59:21", "remaining_time": "0:06:30", "throughput": 5651.66, "total_tokens": 20125728} +{"current_steps": 30575, "total_steps": 33920, "loss": 0.2899, "lr": 2.934943052323008e-07, "epoch": 18.027712264150942, "percentage": 90.14, "elapsed_time": "0:59:21", "remaining_time": "0:06:29", "throughput": 5651.68, "total_tokens": 20129216} +{"current_steps": 30580, "total_steps": 33920, "loss": 0.4901, "lr": 2.926264623052799e-07, "epoch": 18.03066037735849, "percentage": 90.15, "elapsed_time": "0:59:22", "remaining_time": "0:06:29", "throughput": 5651.84, "total_tokens": 20135008} +{"current_steps": 30585, "total_steps": 33920, "loss": 0.2576, "lr": 2.9175986567569036e-07, "epoch": 18.03360849056604, "percentage": 90.17, "elapsed_time": "0:59:23", "remaining_time": "0:06:28", "throughput": 5651.91, "total_tokens": 20138272} +{"current_steps": 30590, "total_steps": 33920, "loss": 0.3203, "lr": 2.9089451557296755e-07, "epoch": 18.036556603773583, "percentage": 90.18, "elapsed_time": "0:59:23", "remaining_time": "0:06:27", "throughput": 5651.89, "total_tokens": 20141536} +{"current_steps": 30595, "total_steps": 33920, "loss": 0.2677, "lr": 2.9003041222621706e-07, "epoch": 18.03950471698113, "percentage": 90.2, "elapsed_time": "0:59:24", "remaining_time": "0:06:27", "throughput": 5652.0, "total_tokens": 20145728} +{"current_steps": 30600, "total_steps": 33920, "loss": 0.3314, "lr": 2.8916755586421375e-07, "epoch": 18.04245283018868, "percentage": 90.21, "elapsed_time": "0:59:24", "remaining_time": "0:06:26", "throughput": 5651.91, "total_tokens": 20148544} +{"current_steps": 30605, "total_steps": 33920, "loss": 0.333, "lr": 2.883059467154031e-07, "epoch": 18.045400943396228, "percentage": 90.23, "elapsed_time": "0:59:25", "remaining_time": "0:06:26", "throughput": 5651.93, "total_tokens": 20151904} +{"current_steps": 30610, "total_steps": 33920, "loss": 0.335, "lr": 2.8744558500789887e-07, "epoch": 18.048349056603772, "percentage": 90.24, "elapsed_time": "0:59:26", "remaining_time": "0:06:25", "throughput": 5651.94, "total_tokens": 20155264} +{"current_steps": 30615, "total_steps": 33920, "loss": 0.2517, "lr": 2.8658647096948546e-07, "epoch": 18.05129716981132, "percentage": 90.26, "elapsed_time": "0:59:26", "remaining_time": "0:06:25", "throughput": 5651.9, "total_tokens": 20158240} +{"current_steps": 30620, "total_steps": 33920, "loss": 0.2661, "lr": 2.8572860482761813e-07, "epoch": 18.05424528301887, "percentage": 90.27, "elapsed_time": "0:59:27", "remaining_time": "0:06:24", "throughput": 5651.89, "total_tokens": 20161344} +{"current_steps": 30625, "total_steps": 33920, "loss": 0.282, "lr": 2.8487198680942017e-07, "epoch": 18.057193396226417, "percentage": 90.29, "elapsed_time": "0:59:27", "remaining_time": "0:06:23", "throughput": 5651.8, "total_tokens": 20164192} +{"current_steps": 30630, "total_steps": 33920, "loss": 0.3425, "lr": 2.840166171416836e-07, "epoch": 18.06014150943396, "percentage": 90.3, "elapsed_time": "0:59:28", "remaining_time": "0:06:23", "throughput": 5651.75, "total_tokens": 20167456} +{"current_steps": 30635, "total_steps": 33920, "loss": 0.2527, "lr": 2.8316249605087386e-07, "epoch": 18.06308962264151, "percentage": 90.32, "elapsed_time": "0:59:28", "remaining_time": "0:06:22", "throughput": 5651.61, "total_tokens": 20169920} +{"current_steps": 30640, "total_steps": 33920, "loss": 0.494, "lr": 2.823096237631212e-07, "epoch": 18.066037735849058, "percentage": 90.33, "elapsed_time": "0:59:29", "remaining_time": "0:06:22", "throughput": 5651.58, "total_tokens": 20172896} +{"current_steps": 30645, "total_steps": 33920, "loss": 0.2346, "lr": 2.814580005042283e-07, "epoch": 18.068985849056602, "percentage": 90.34, "elapsed_time": "0:59:30", "remaining_time": "0:06:21", "throughput": 5651.66, "total_tokens": 20177024} +{"current_steps": 30650, "total_steps": 33920, "loss": 0.3488, "lr": 2.8060762649966435e-07, "epoch": 18.07193396226415, "percentage": 90.36, "elapsed_time": "0:59:30", "remaining_time": "0:06:20", "throughput": 5651.66, "total_tokens": 20180416} +{"current_steps": 30655, "total_steps": 33920, "loss": 0.2322, "lr": 2.797585019745713e-07, "epoch": 18.0748820754717, "percentage": 90.37, "elapsed_time": "0:59:31", "remaining_time": "0:06:20", "throughput": 5651.7, "total_tokens": 20183840} +{"current_steps": 30660, "total_steps": 33920, "loss": 0.4089, "lr": 2.789106271537584e-07, "epoch": 18.077830188679247, "percentage": 90.39, "elapsed_time": "0:59:31", "remaining_time": "0:06:19", "throughput": 5651.68, "total_tokens": 20186784} +{"current_steps": 30665, "total_steps": 33920, "loss": 0.2981, "lr": 2.780640022617037e-07, "epoch": 18.08077830188679, "percentage": 90.4, "elapsed_time": "0:59:32", "remaining_time": "0:06:19", "throughput": 5651.61, "total_tokens": 20189440} +{"current_steps": 30670, "total_steps": 33920, "loss": 0.3085, "lr": 2.772186275225547e-07, "epoch": 18.08372641509434, "percentage": 90.42, "elapsed_time": "0:59:32", "remaining_time": "0:06:18", "throughput": 5651.48, "total_tokens": 20191936} +{"current_steps": 30675, "total_steps": 33920, "loss": 0.3451, "lr": 2.7637450316012836e-07, "epoch": 18.086674528301888, "percentage": 90.43, "elapsed_time": "0:59:33", "remaining_time": "0:06:18", "throughput": 5651.68, "total_tokens": 20196288} +{"current_steps": 30680, "total_steps": 33920, "loss": 0.3475, "lr": 2.755316293979088e-07, "epoch": 18.089622641509433, "percentage": 90.45, "elapsed_time": "0:59:34", "remaining_time": "0:06:17", "throughput": 5651.87, "total_tokens": 20203232} +{"current_steps": 30685, "total_steps": 33920, "loss": 0.3314, "lr": 2.7469000645905295e-07, "epoch": 18.09257075471698, "percentage": 90.46, "elapsed_time": "0:59:35", "remaining_time": "0:06:16", "throughput": 5651.91, "total_tokens": 20206752} +{"current_steps": 30690, "total_steps": 33920, "loss": 0.3292, "lr": 2.738496345663827e-07, "epoch": 18.09551886792453, "percentage": 90.48, "elapsed_time": "0:59:35", "remaining_time": "0:06:16", "throughput": 5652.01, "total_tokens": 20210400} +{"current_steps": 30695, "total_steps": 33920, "loss": 0.2567, "lr": 2.7301051394239e-07, "epoch": 18.098466981132077, "percentage": 90.49, "elapsed_time": "0:59:36", "remaining_time": "0:06:15", "throughput": 5652.01, "total_tokens": 20213664} +{"current_steps": 30700, "total_steps": 33920, "loss": 0.2703, "lr": 2.72172644809236e-07, "epoch": 18.10141509433962, "percentage": 90.51, "elapsed_time": "0:59:36", "remaining_time": "0:06:15", "throughput": 5652.03, "total_tokens": 20217056} +{"current_steps": 30705, "total_steps": 33920, "loss": 0.242, "lr": 2.7133602738875e-07, "epoch": 18.10436320754717, "percentage": 90.52, "elapsed_time": "0:59:37", "remaining_time": "0:06:14", "throughput": 5652.09, "total_tokens": 20220480} +{"current_steps": 30710, "total_steps": 33920, "loss": 0.315, "lr": 2.7050066190242976e-07, "epoch": 18.107311320754718, "percentage": 90.54, "elapsed_time": "0:59:38", "remaining_time": "0:06:14", "throughput": 5652.32, "total_tokens": 20227424} +{"current_steps": 30715, "total_steps": 33920, "loss": 0.309, "lr": 2.696665485714428e-07, "epoch": 18.110259433962263, "percentage": 90.55, "elapsed_time": "0:59:39", "remaining_time": "0:06:13", "throughput": 5652.47, "total_tokens": 20231424} +{"current_steps": 30720, "total_steps": 33920, "loss": 0.295, "lr": 2.6883368761662367e-07, "epoch": 18.11320754716981, "percentage": 90.57, "elapsed_time": "0:59:39", "remaining_time": "0:06:12", "throughput": 5652.48, "total_tokens": 20234464} +{"current_steps": 30725, "total_steps": 33920, "loss": 0.435, "lr": 2.680020792584759e-07, "epoch": 18.11615566037736, "percentage": 90.58, "elapsed_time": "0:59:40", "remaining_time": "0:06:12", "throughput": 5652.56, "total_tokens": 20237888} +{"current_steps": 30730, "total_steps": 33920, "loss": 0.3982, "lr": 2.6717172371717113e-07, "epoch": 18.119103773584907, "percentage": 90.6, "elapsed_time": "0:59:40", "remaining_time": "0:06:11", "throughput": 5652.52, "total_tokens": 20240640} +{"current_steps": 30735, "total_steps": 33920, "loss": 0.4454, "lr": 2.663426212125503e-07, "epoch": 18.122051886792452, "percentage": 90.61, "elapsed_time": "0:59:41", "remaining_time": "0:06:11", "throughput": 5652.57, "total_tokens": 20244224} +{"current_steps": 30740, "total_steps": 33920, "loss": 0.3238, "lr": 2.655147719641216e-07, "epoch": 18.125, "percentage": 90.62, "elapsed_time": "0:59:42", "remaining_time": "0:06:10", "throughput": 5652.69, "total_tokens": 20248128} +{"current_steps": 30745, "total_steps": 33920, "loss": 0.3743, "lr": 2.646881761910602e-07, "epoch": 18.127948113207548, "percentage": 90.64, "elapsed_time": "0:59:42", "remaining_time": "0:06:09", "throughput": 5652.82, "total_tokens": 20252160} +{"current_steps": 30750, "total_steps": 33920, "loss": 0.2597, "lr": 2.638628341122135e-07, "epoch": 18.130896226415093, "percentage": 90.65, "elapsed_time": "0:59:43", "remaining_time": "0:06:09", "throughput": 5652.78, "total_tokens": 20255488} +{"current_steps": 30755, "total_steps": 33920, "loss": 0.2966, "lr": 2.6303874594609314e-07, "epoch": 18.13384433962264, "percentage": 90.67, "elapsed_time": "0:59:43", "remaining_time": "0:06:08", "throughput": 5652.82, "total_tokens": 20258720} +{"current_steps": 30760, "total_steps": 33920, "loss": 0.3143, "lr": 2.622159119108797e-07, "epoch": 18.13679245283019, "percentage": 90.68, "elapsed_time": "0:59:44", "remaining_time": "0:06:08", "throughput": 5652.8, "total_tokens": 20261728} +{"current_steps": 30765, "total_steps": 33920, "loss": 0.1921, "lr": 2.6139433222442226e-07, "epoch": 18.139740566037737, "percentage": 90.7, "elapsed_time": "0:59:45", "remaining_time": "0:06:07", "throughput": 5652.87, "total_tokens": 20265696} +{"current_steps": 30770, "total_steps": 33920, "loss": 0.2661, "lr": 2.6057400710423787e-07, "epoch": 18.142688679245282, "percentage": 90.71, "elapsed_time": "0:59:45", "remaining_time": "0:06:07", "throughput": 5653.01, "total_tokens": 20269248} +{"current_steps": 30775, "total_steps": 33920, "loss": 0.3622, "lr": 2.5975493676751004e-07, "epoch": 18.14563679245283, "percentage": 90.73, "elapsed_time": "0:59:46", "remaining_time": "0:06:06", "throughput": 5653.06, "total_tokens": 20272896} +{"current_steps": 30780, "total_steps": 33920, "loss": 0.2917, "lr": 2.589371214310926e-07, "epoch": 18.14858490566038, "percentage": 90.74, "elapsed_time": "0:59:46", "remaining_time": "0:06:05", "throughput": 5653.05, "total_tokens": 20275744} +{"current_steps": 30785, "total_steps": 33920, "loss": 0.2928, "lr": 2.581205613115051e-07, "epoch": 18.151533018867923, "percentage": 90.76, "elapsed_time": "0:59:47", "remaining_time": "0:06:05", "throughput": 5652.92, "total_tokens": 20278368} +{"current_steps": 30790, "total_steps": 33920, "loss": 0.3468, "lr": 2.573052566249357e-07, "epoch": 18.15448113207547, "percentage": 90.77, "elapsed_time": "0:59:47", "remaining_time": "0:06:04", "throughput": 5652.85, "total_tokens": 20281120} +{"current_steps": 30795, "total_steps": 33920, "loss": 0.3574, "lr": 2.5649120758723945e-07, "epoch": 18.15742924528302, "percentage": 90.79, "elapsed_time": "0:59:48", "remaining_time": "0:06:04", "throughput": 5652.75, "total_tokens": 20283712} +{"current_steps": 30800, "total_steps": 33920, "loss": 0.2377, "lr": 2.5567841441393906e-07, "epoch": 18.160377358490567, "percentage": 90.8, "elapsed_time": "0:59:48", "remaining_time": "0:06:03", "throughput": 5652.75, "total_tokens": 20287072} +{"current_steps": 30805, "total_steps": 33920, "loss": 0.3674, "lr": 2.548668773202245e-07, "epoch": 18.163325471698112, "percentage": 90.82, "elapsed_time": "0:59:49", "remaining_time": "0:06:02", "throughput": 5652.83, "total_tokens": 20290816} +{"current_steps": 30810, "total_steps": 33920, "loss": 0.2954, "lr": 2.5405659652095573e-07, "epoch": 18.16627358490566, "percentage": 90.83, "elapsed_time": "0:59:50", "remaining_time": "0:06:02", "throughput": 5652.86, "total_tokens": 20293920} +{"current_steps": 30815, "total_steps": 33920, "loss": 0.3877, "lr": 2.5324757223065655e-07, "epoch": 18.16922169811321, "percentage": 90.85, "elapsed_time": "0:59:50", "remaining_time": "0:06:01", "throughput": 5653.06, "total_tokens": 20298720} +{"current_steps": 30820, "total_steps": 33920, "loss": 0.2492, "lr": 2.524398046635207e-07, "epoch": 18.172169811320753, "percentage": 90.86, "elapsed_time": "0:59:51", "remaining_time": "0:06:01", "throughput": 5653.21, "total_tokens": 20303424} +{"current_steps": 30825, "total_steps": 33920, "loss": 0.2431, "lr": 2.51633294033406e-07, "epoch": 18.1751179245283, "percentage": 90.88, "elapsed_time": "0:59:52", "remaining_time": "0:06:00", "throughput": 5653.2, "total_tokens": 20306400} +{"current_steps": 30830, "total_steps": 33920, "loss": 0.3308, "lr": 2.5082804055384214e-07, "epoch": 18.17806603773585, "percentage": 90.89, "elapsed_time": "0:59:52", "remaining_time": "0:06:00", "throughput": 5653.22, "total_tokens": 20309440} +{"current_steps": 30835, "total_steps": 33920, "loss": 0.3599, "lr": 2.50024044438022e-07, "epoch": 18.181014150943398, "percentage": 90.91, "elapsed_time": "0:59:53", "remaining_time": "0:05:59", "throughput": 5653.25, "total_tokens": 20312736} +{"current_steps": 30840, "total_steps": 33920, "loss": 0.2549, "lr": 2.492213058988069e-07, "epoch": 18.183962264150942, "percentage": 90.92, "elapsed_time": "0:59:53", "remaining_time": "0:05:58", "throughput": 5653.16, "total_tokens": 20315424} +{"current_steps": 30845, "total_steps": 33920, "loss": 0.3904, "lr": 2.4841982514872633e-07, "epoch": 18.18691037735849, "percentage": 90.93, "elapsed_time": "0:59:54", "remaining_time": "0:05:58", "throughput": 5653.06, "total_tokens": 20318176} +{"current_steps": 30850, "total_steps": 33920, "loss": 0.4196, "lr": 2.4761960239997497e-07, "epoch": 18.18985849056604, "percentage": 90.95, "elapsed_time": "0:59:55", "remaining_time": "0:05:57", "throughput": 5653.26, "total_tokens": 20324320} +{"current_steps": 30855, "total_steps": 33920, "loss": 0.1906, "lr": 2.4682063786441556e-07, "epoch": 18.192806603773583, "percentage": 90.96, "elapsed_time": "0:59:55", "remaining_time": "0:05:57", "throughput": 5653.21, "total_tokens": 20327136} +{"current_steps": 30860, "total_steps": 33920, "loss": 0.2517, "lr": 2.460229317535778e-07, "epoch": 18.19575471698113, "percentage": 90.98, "elapsed_time": "0:59:56", "remaining_time": "0:05:56", "throughput": 5653.25, "total_tokens": 20330816} +{"current_steps": 30865, "total_steps": 33920, "loss": 0.2761, "lr": 2.4522648427865725e-07, "epoch": 18.19870283018868, "percentage": 90.99, "elapsed_time": "0:59:56", "remaining_time": "0:05:56", "throughput": 5653.22, "total_tokens": 20333696} +{"current_steps": 30870, "total_steps": 33920, "loss": 0.4167, "lr": 2.444312956505163e-07, "epoch": 18.201650943396228, "percentage": 91.01, "elapsed_time": "0:59:57", "remaining_time": "0:05:55", "throughput": 5653.25, "total_tokens": 20336768} +{"current_steps": 30875, "total_steps": 33920, "loss": 0.2687, "lr": 2.4363736607968537e-07, "epoch": 18.204599056603772, "percentage": 91.02, "elapsed_time": "0:59:57", "remaining_time": "0:05:54", "throughput": 5653.2, "total_tokens": 20339552} +{"current_steps": 30880, "total_steps": 33920, "loss": 0.2761, "lr": 2.428446957763608e-07, "epoch": 18.20754716981132, "percentage": 91.04, "elapsed_time": "0:59:58", "remaining_time": "0:05:54", "throughput": 5653.16, "total_tokens": 20343136} +{"current_steps": 30885, "total_steps": 33920, "loss": 0.3296, "lr": 2.4205328495040535e-07, "epoch": 18.21049528301887, "percentage": 91.05, "elapsed_time": "0:59:59", "remaining_time": "0:05:53", "throughput": 5652.95, "total_tokens": 20345728} +{"current_steps": 30890, "total_steps": 33920, "loss": 0.2712, "lr": 2.412631338113486e-07, "epoch": 18.213443396226417, "percentage": 91.07, "elapsed_time": "0:59:59", "remaining_time": "0:05:53", "throughput": 5652.94, "total_tokens": 20348832} +{"current_steps": 30895, "total_steps": 33920, "loss": 0.3167, "lr": 2.404742425683848e-07, "epoch": 18.21639150943396, "percentage": 91.08, "elapsed_time": "1:00:00", "remaining_time": "0:05:52", "throughput": 5653.08, "total_tokens": 20352896} +{"current_steps": 30900, "total_steps": 33920, "loss": 0.3657, "lr": 2.3968661143037864e-07, "epoch": 18.21933962264151, "percentage": 91.1, "elapsed_time": "1:00:00", "remaining_time": "0:05:51", "throughput": 5652.91, "total_tokens": 20355584} +{"current_steps": 30905, "total_steps": 33920, "loss": 0.393, "lr": 2.3890024060585823e-07, "epoch": 18.222287735849058, "percentage": 91.11, "elapsed_time": "1:00:01", "remaining_time": "0:05:51", "throughput": 5652.98, "total_tokens": 20359072} +{"current_steps": 30910, "total_steps": 33920, "loss": 0.3193, "lr": 2.3811513030301826e-07, "epoch": 18.225235849056602, "percentage": 91.13, "elapsed_time": "1:00:02", "remaining_time": "0:05:50", "throughput": 5652.88, "total_tokens": 20361696} +{"current_steps": 30915, "total_steps": 33920, "loss": 0.2675, "lr": 2.373312807297201e-07, "epoch": 18.22818396226415, "percentage": 91.14, "elapsed_time": "1:00:02", "remaining_time": "0:05:50", "throughput": 5652.98, "total_tokens": 20365888} +{"current_steps": 30920, "total_steps": 33920, "loss": 0.3274, "lr": 2.3654869209349007e-07, "epoch": 18.2311320754717, "percentage": 91.16, "elapsed_time": "1:00:03", "remaining_time": "0:05:49", "throughput": 5653.02, "total_tokens": 20369120} +{"current_steps": 30925, "total_steps": 33920, "loss": 0.2737, "lr": 2.357673646015246e-07, "epoch": 18.234080188679247, "percentage": 91.17, "elapsed_time": "1:00:03", "remaining_time": "0:05:49", "throughput": 5652.99, "total_tokens": 20372000} +{"current_steps": 30930, "total_steps": 33920, "loss": 0.3645, "lr": 2.3498729846068103e-07, "epoch": 18.23702830188679, "percentage": 91.19, "elapsed_time": "1:00:04", "remaining_time": "0:05:48", "throughput": 5653.03, "total_tokens": 20375104} +{"current_steps": 30935, "total_steps": 33920, "loss": 0.2738, "lr": 2.342084938774869e-07, "epoch": 18.23997641509434, "percentage": 91.2, "elapsed_time": "1:00:04", "remaining_time": "0:05:47", "throughput": 5652.88, "total_tokens": 20377472} +{"current_steps": 30940, "total_steps": 33920, "loss": 0.2884, "lr": 2.334309510581334e-07, "epoch": 18.242924528301888, "percentage": 91.21, "elapsed_time": "1:00:05", "remaining_time": "0:05:47", "throughput": 5652.65, "total_tokens": 20379744} +{"current_steps": 30945, "total_steps": 33920, "loss": 0.2372, "lr": 2.3265467020847864e-07, "epoch": 18.245872641509433, "percentage": 91.23, "elapsed_time": "1:00:05", "remaining_time": "0:05:46", "throughput": 5652.5, "total_tokens": 20382144} +{"current_steps": 30950, "total_steps": 33920, "loss": 0.3478, "lr": 2.31879651534046e-07, "epoch": 18.24882075471698, "percentage": 91.24, "elapsed_time": "1:00:06", "remaining_time": "0:05:46", "throughput": 5652.53, "total_tokens": 20385344} +{"current_steps": 30955, "total_steps": 33920, "loss": 0.3735, "lr": 2.311058952400247e-07, "epoch": 18.25176886792453, "percentage": 91.26, "elapsed_time": "1:00:06", "remaining_time": "0:05:45", "throughput": 5652.49, "total_tokens": 20388224} +{"current_steps": 30960, "total_steps": 33920, "loss": 0.2429, "lr": 2.3033340153127026e-07, "epoch": 18.254716981132077, "percentage": 91.27, "elapsed_time": "1:00:07", "remaining_time": "0:05:44", "throughput": 5652.48, "total_tokens": 20391040} +{"current_steps": 30965, "total_steps": 33920, "loss": 0.2721, "lr": 2.295621706123041e-07, "epoch": 18.25766509433962, "percentage": 91.29, "elapsed_time": "1:00:08", "remaining_time": "0:05:44", "throughput": 5652.44, "total_tokens": 20394208} +{"current_steps": 30970, "total_steps": 33920, "loss": 0.3591, "lr": 2.287922026873135e-07, "epoch": 18.26061320754717, "percentage": 91.3, "elapsed_time": "1:00:08", "remaining_time": "0:05:43", "throughput": 5652.43, "total_tokens": 20397248} +{"current_steps": 30975, "total_steps": 33920, "loss": 0.303, "lr": 2.2802349796014923e-07, "epoch": 18.263561320754718, "percentage": 91.32, "elapsed_time": "1:00:09", "remaining_time": "0:05:43", "throughput": 5652.49, "total_tokens": 20401408} +{"current_steps": 30980, "total_steps": 33920, "loss": 0.308, "lr": 2.2725605663433013e-07, "epoch": 18.266509433962263, "percentage": 91.33, "elapsed_time": "1:00:09", "remaining_time": "0:05:42", "throughput": 5652.62, "total_tokens": 20405824} +{"current_steps": 30985, "total_steps": 33920, "loss": 0.2213, "lr": 2.264898789130393e-07, "epoch": 18.26945754716981, "percentage": 91.35, "elapsed_time": "1:00:10", "remaining_time": "0:05:42", "throughput": 5652.63, "total_tokens": 20408992} +{"current_steps": 30990, "total_steps": 33920, "loss": 0.2893, "lr": 2.2572496499912554e-07, "epoch": 18.27240566037736, "percentage": 91.36, "elapsed_time": "1:00:11", "remaining_time": "0:05:41", "throughput": 5652.69, "total_tokens": 20412320} +{"current_steps": 30995, "total_steps": 33920, "loss": 0.272, "lr": 2.2496131509510354e-07, "epoch": 18.275353773584907, "percentage": 91.38, "elapsed_time": "1:00:11", "remaining_time": "0:05:40", "throughput": 5652.69, "total_tokens": 20415488} +{"current_steps": 31000, "total_steps": 33920, "loss": 0.2071, "lr": 2.2419892940315268e-07, "epoch": 18.278301886792452, "percentage": 91.39, "elapsed_time": "1:00:12", "remaining_time": "0:05:40", "throughput": 5652.76, "total_tokens": 20419136} +{"current_steps": 31005, "total_steps": 33920, "loss": 0.284, "lr": 2.2343780812511819e-07, "epoch": 18.28125, "percentage": 91.41, "elapsed_time": "1:00:12", "remaining_time": "0:05:39", "throughput": 5652.77, "total_tokens": 20422112} +{"current_steps": 31010, "total_steps": 33920, "loss": 0.3187, "lr": 2.2267795146250936e-07, "epoch": 18.284198113207548, "percentage": 91.42, "elapsed_time": "1:00:13", "remaining_time": "0:05:39", "throughput": 5652.7, "total_tokens": 20424896} +{"current_steps": 31015, "total_steps": 33920, "loss": 0.3575, "lr": 2.2191935961650146e-07, "epoch": 18.287146226415093, "percentage": 91.44, "elapsed_time": "1:00:13", "remaining_time": "0:05:38", "throughput": 5652.58, "total_tokens": 20427392} +{"current_steps": 31020, "total_steps": 33920, "loss": 0.3512, "lr": 2.2116203278793603e-07, "epoch": 18.29009433962264, "percentage": 91.45, "elapsed_time": "1:00:14", "remaining_time": "0:05:37", "throughput": 5652.66, "total_tokens": 20431168} +{"current_steps": 31025, "total_steps": 33920, "loss": 0.2465, "lr": 2.2040597117731766e-07, "epoch": 18.29304245283019, "percentage": 91.47, "elapsed_time": "1:00:14", "remaining_time": "0:05:37", "throughput": 5652.57, "total_tokens": 20433824} +{"current_steps": 31030, "total_steps": 33920, "loss": 0.279, "lr": 2.1965117498481793e-07, "epoch": 18.295990566037737, "percentage": 91.48, "elapsed_time": "1:00:15", "remaining_time": "0:05:36", "throughput": 5652.61, "total_tokens": 20436864} +{"current_steps": 31035, "total_steps": 33920, "loss": 0.3014, "lr": 2.188976444102714e-07, "epoch": 18.298938679245282, "percentage": 91.49, "elapsed_time": "1:00:16", "remaining_time": "0:05:36", "throughput": 5652.58, "total_tokens": 20440224} +{"current_steps": 31040, "total_steps": 33920, "loss": 0.4008, "lr": 2.181453796531796e-07, "epoch": 18.30188679245283, "percentage": 91.51, "elapsed_time": "1:00:16", "remaining_time": "0:05:35", "throughput": 5652.53, "total_tokens": 20443232} +{"current_steps": 31045, "total_steps": 33920, "loss": 0.2953, "lr": 2.1739438091270658e-07, "epoch": 18.30483490566038, "percentage": 91.52, "elapsed_time": "1:00:17", "remaining_time": "0:05:34", "throughput": 5652.42, "total_tokens": 20445920} +{"current_steps": 31050, "total_steps": 33920, "loss": 0.3937, "lr": 2.1664464838768329e-07, "epoch": 18.307783018867923, "percentage": 91.54, "elapsed_time": "1:00:17", "remaining_time": "0:05:34", "throughput": 5652.4, "total_tokens": 20449088} +{"current_steps": 31055, "total_steps": 33920, "loss": 0.2997, "lr": 2.1589618227660426e-07, "epoch": 18.31073113207547, "percentage": 91.55, "elapsed_time": "1:00:18", "remaining_time": "0:05:33", "throughput": 5652.38, "total_tokens": 20452224} +{"current_steps": 31060, "total_steps": 33920, "loss": 0.2861, "lr": 2.151489827776293e-07, "epoch": 18.31367924528302, "percentage": 91.57, "elapsed_time": "1:00:18", "remaining_time": "0:05:33", "throughput": 5652.32, "total_tokens": 20455392} +{"current_steps": 31065, "total_steps": 33920, "loss": 0.2955, "lr": 2.1440305008858298e-07, "epoch": 18.316627358490567, "percentage": 91.58, "elapsed_time": "1:00:19", "remaining_time": "0:05:32", "throughput": 5652.2, "total_tokens": 20458336} +{"current_steps": 31070, "total_steps": 33920, "loss": 0.3376, "lr": 2.1365838440695397e-07, "epoch": 18.319575471698112, "percentage": 91.6, "elapsed_time": "1:00:20", "remaining_time": "0:05:32", "throughput": 5652.11, "total_tokens": 20460960} +{"current_steps": 31075, "total_steps": 33920, "loss": 0.2725, "lr": 2.129149859298957e-07, "epoch": 18.32252358490566, "percentage": 91.61, "elapsed_time": "1:00:20", "remaining_time": "0:05:31", "throughput": 5652.02, "total_tokens": 20463744} +{"current_steps": 31080, "total_steps": 33920, "loss": 0.3473, "lr": 2.1217285485422622e-07, "epoch": 18.32547169811321, "percentage": 91.63, "elapsed_time": "1:00:21", "remaining_time": "0:05:30", "throughput": 5652.02, "total_tokens": 20466784} +{"current_steps": 31085, "total_steps": 33920, "loss": 0.1903, "lr": 2.114319913764268e-07, "epoch": 18.328419811320753, "percentage": 91.64, "elapsed_time": "1:00:21", "remaining_time": "0:05:30", "throughput": 5652.06, "total_tokens": 20470784} +{"current_steps": 31090, "total_steps": 33920, "loss": 0.3881, "lr": 2.10692395692646e-07, "epoch": 18.3313679245283, "percentage": 91.66, "elapsed_time": "1:00:22", "remaining_time": "0:05:29", "throughput": 5652.0, "total_tokens": 20473568} +{"current_steps": 31095, "total_steps": 33920, "loss": 0.2965, "lr": 2.0995406799869444e-07, "epoch": 18.33431603773585, "percentage": 91.67, "elapsed_time": "1:00:22", "remaining_time": "0:05:29", "throughput": 5652.07, "total_tokens": 20476896} +{"current_steps": 31100, "total_steps": 33920, "loss": 0.3841, "lr": 2.0921700849004743e-07, "epoch": 18.337264150943398, "percentage": 91.69, "elapsed_time": "1:00:23", "remaining_time": "0:05:28", "throughput": 5652.09, "total_tokens": 20480288} +{"current_steps": 31105, "total_steps": 33920, "loss": 0.3356, "lr": 2.084812173618439e-07, "epoch": 18.340212264150942, "percentage": 91.7, "elapsed_time": "1:00:24", "remaining_time": "0:05:27", "throughput": 5652.13, "total_tokens": 20483456} +{"current_steps": 31110, "total_steps": 33920, "loss": 0.2546, "lr": 2.0774669480888853e-07, "epoch": 18.34316037735849, "percentage": 91.72, "elapsed_time": "1:00:24", "remaining_time": "0:05:27", "throughput": 5652.02, "total_tokens": 20486048} +{"current_steps": 31115, "total_steps": 33920, "loss": 0.2331, "lr": 2.0701344102564912e-07, "epoch": 18.34610849056604, "percentage": 91.73, "elapsed_time": "1:00:25", "remaining_time": "0:05:26", "throughput": 5652.02, "total_tokens": 20489216} +{"current_steps": 31120, "total_steps": 33920, "loss": 0.2636, "lr": 2.062814562062576e-07, "epoch": 18.349056603773583, "percentage": 91.75, "elapsed_time": "1:00:25", "remaining_time": "0:05:26", "throughput": 5652.04, "total_tokens": 20492576} +{"current_steps": 31125, "total_steps": 33920, "loss": 0.3102, "lr": 2.0555074054451063e-07, "epoch": 18.35200471698113, "percentage": 91.76, "elapsed_time": "1:00:26", "remaining_time": "0:05:25", "throughput": 5652.03, "total_tokens": 20496032} +{"current_steps": 31130, "total_steps": 33920, "loss": 0.2613, "lr": 2.0482129423386843e-07, "epoch": 18.35495283018868, "percentage": 91.77, "elapsed_time": "1:00:26", "remaining_time": "0:05:25", "throughput": 5651.97, "total_tokens": 20499008} +{"current_steps": 31135, "total_steps": 33920, "loss": 0.2769, "lr": 2.040931174674543e-07, "epoch": 18.357900943396228, "percentage": 91.79, "elapsed_time": "1:00:27", "remaining_time": "0:05:24", "throughput": 5652.12, "total_tokens": 20503584} +{"current_steps": 31140, "total_steps": 33920, "loss": 0.268, "lr": 2.0336621043805682e-07, "epoch": 18.360849056603772, "percentage": 91.8, "elapsed_time": "1:00:28", "remaining_time": "0:05:23", "throughput": 5652.18, "total_tokens": 20507264} +{"current_steps": 31145, "total_steps": 33920, "loss": 0.2399, "lr": 2.0264057333812704e-07, "epoch": 18.36379716981132, "percentage": 91.82, "elapsed_time": "1:00:28", "remaining_time": "0:05:23", "throughput": 5652.03, "total_tokens": 20509728} +{"current_steps": 31150, "total_steps": 33920, "loss": 0.3001, "lr": 2.0191620635978127e-07, "epoch": 18.36674528301887, "percentage": 91.83, "elapsed_time": "1:00:29", "remaining_time": "0:05:22", "throughput": 5651.99, "total_tokens": 20512480} +{"current_steps": 31155, "total_steps": 33920, "loss": 0.3345, "lr": 2.0119310969479833e-07, "epoch": 18.369693396226417, "percentage": 91.85, "elapsed_time": "1:00:29", "remaining_time": "0:05:22", "throughput": 5651.96, "total_tokens": 20515520} +{"current_steps": 31160, "total_steps": 33920, "loss": 0.2886, "lr": 2.004712835346212e-07, "epoch": 18.37264150943396, "percentage": 91.86, "elapsed_time": "1:00:30", "remaining_time": "0:05:21", "throughput": 5651.84, "total_tokens": 20518400} +{"current_steps": 31165, "total_steps": 33920, "loss": 0.2344, "lr": 1.99750728070357e-07, "epoch": 18.37558962264151, "percentage": 91.88, "elapsed_time": "1:00:30", "remaining_time": "0:05:20", "throughput": 5651.94, "total_tokens": 20522048} +{"current_steps": 31170, "total_steps": 33920, "loss": 0.3083, "lr": 1.9903144349277536e-07, "epoch": 18.378537735849058, "percentage": 91.89, "elapsed_time": "1:00:31", "remaining_time": "0:05:20", "throughput": 5651.89, "total_tokens": 20525312} +{"current_steps": 31175, "total_steps": 33920, "loss": 0.316, "lr": 1.983134299923095e-07, "epoch": 18.381485849056602, "percentage": 91.91, "elapsed_time": "1:00:32", "remaining_time": "0:05:19", "throughput": 5651.85, "total_tokens": 20528480} +{"current_steps": 31180, "total_steps": 33920, "loss": 0.1829, "lr": 1.9759668775905737e-07, "epoch": 18.38443396226415, "percentage": 91.92, "elapsed_time": "1:00:33", "remaining_time": "0:05:19", "throughput": 5652.04, "total_tokens": 20534944} +{"current_steps": 31185, "total_steps": 33920, "loss": 0.2321, "lr": 1.9688121698277995e-07, "epoch": 18.3873820754717, "percentage": 91.94, "elapsed_time": "1:00:33", "remaining_time": "0:05:18", "throughput": 5651.95, "total_tokens": 20537568} +{"current_steps": 31190, "total_steps": 33920, "loss": 0.2692, "lr": 1.9616701785290015e-07, "epoch": 18.390330188679247, "percentage": 91.95, "elapsed_time": "1:00:34", "remaining_time": "0:05:18", "throughput": 5652.02, "total_tokens": 20541248} +{"current_steps": 31195, "total_steps": 33920, "loss": 0.3523, "lr": 1.954540905585056e-07, "epoch": 18.39327830188679, "percentage": 91.97, "elapsed_time": "1:00:34", "remaining_time": "0:05:17", "throughput": 5652.06, "total_tokens": 20544384} +{"current_steps": 31200, "total_steps": 33920, "loss": 0.3126, "lr": 1.9474243528834757e-07, "epoch": 18.39622641509434, "percentage": 91.98, "elapsed_time": "1:00:35", "remaining_time": "0:05:16", "throughput": 5652.15, "total_tokens": 20548096} +{"current_steps": 31205, "total_steps": 33920, "loss": 0.2781, "lr": 1.9403205223083866e-07, "epoch": 18.399174528301888, "percentage": 92.0, "elapsed_time": "1:00:35", "remaining_time": "0:05:16", "throughput": 5652.2, "total_tokens": 20551328} +{"current_steps": 31210, "total_steps": 33920, "loss": 0.3699, "lr": 1.9332294157405619e-07, "epoch": 18.402122641509433, "percentage": 92.01, "elapsed_time": "1:00:36", "remaining_time": "0:05:15", "throughput": 5652.32, "total_tokens": 20555680} +{"current_steps": 31215, "total_steps": 33920, "loss": 0.2894, "lr": 1.926151035057411e-07, "epoch": 18.40507075471698, "percentage": 92.03, "elapsed_time": "1:00:37", "remaining_time": "0:05:15", "throughput": 5652.47, "total_tokens": 20559680} +{"current_steps": 31220, "total_steps": 33920, "loss": 0.3567, "lr": 1.9190853821329626e-07, "epoch": 18.40801886792453, "percentage": 92.04, "elapsed_time": "1:00:37", "remaining_time": "0:05:14", "throughput": 5652.47, "total_tokens": 20563136} +{"current_steps": 31225, "total_steps": 33920, "loss": 0.2883, "lr": 1.9120324588378757e-07, "epoch": 18.410966981132077, "percentage": 92.05, "elapsed_time": "1:00:38", "remaining_time": "0:05:14", "throughput": 5652.48, "total_tokens": 20566272} +{"current_steps": 31230, "total_steps": 33920, "loss": 0.301, "lr": 1.9049922670394461e-07, "epoch": 18.41391509433962, "percentage": 92.07, "elapsed_time": "1:00:38", "remaining_time": "0:05:13", "throughput": 5652.48, "total_tokens": 20569312} +{"current_steps": 31235, "total_steps": 33920, "loss": 0.2339, "lr": 1.897964808601588e-07, "epoch": 18.41686320754717, "percentage": 92.08, "elapsed_time": "1:00:39", "remaining_time": "0:05:12", "throughput": 5652.45, "total_tokens": 20572224} +{"current_steps": 31240, "total_steps": 33920, "loss": 0.2335, "lr": 1.8909500853848517e-07, "epoch": 18.419811320754718, "percentage": 92.1, "elapsed_time": "1:00:40", "remaining_time": "0:05:12", "throughput": 5652.33, "total_tokens": 20574816} +{"current_steps": 31245, "total_steps": 33920, "loss": 0.3102, "lr": 1.8839480992464243e-07, "epoch": 18.422759433962263, "percentage": 92.11, "elapsed_time": "1:00:40", "remaining_time": "0:05:11", "throughput": 5652.26, "total_tokens": 20577920} +{"current_steps": 31250, "total_steps": 33920, "loss": 0.3214, "lr": 1.8769588520401005e-07, "epoch": 18.42570754716981, "percentage": 92.13, "elapsed_time": "1:00:41", "remaining_time": "0:05:11", "throughput": 5652.18, "total_tokens": 20580672} +{"current_steps": 31255, "total_steps": 33920, "loss": 0.2898, "lr": 1.8699823456163279e-07, "epoch": 18.42865566037736, "percentage": 92.14, "elapsed_time": "1:00:41", "remaining_time": "0:05:10", "throughput": 5652.1, "total_tokens": 20583392} +{"current_steps": 31260, "total_steps": 33920, "loss": 0.3057, "lr": 1.8630185818221514e-07, "epoch": 18.431603773584907, "percentage": 92.16, "elapsed_time": "1:00:42", "remaining_time": "0:05:09", "throughput": 5652.16, "total_tokens": 20586688} +{"current_steps": 31265, "total_steps": 33920, "loss": 0.3355, "lr": 1.856067562501268e-07, "epoch": 18.434551886792452, "percentage": 92.17, "elapsed_time": "1:00:42", "remaining_time": "0:05:09", "throughput": 5652.2, "total_tokens": 20590272} +{"current_steps": 31270, "total_steps": 33920, "loss": 0.2169, "lr": 1.8491292894939837e-07, "epoch": 18.4375, "percentage": 92.19, "elapsed_time": "1:00:43", "remaining_time": "0:05:08", "throughput": 5652.38, "total_tokens": 20594976} +{"current_steps": 31275, "total_steps": 33920, "loss": 0.255, "lr": 1.8422037646372405e-07, "epoch": 18.440448113207548, "percentage": 92.2, "elapsed_time": "1:00:44", "remaining_time": "0:05:08", "throughput": 5652.52, "total_tokens": 20599040} +{"current_steps": 31280, "total_steps": 33920, "loss": 0.4638, "lr": 1.8352909897645989e-07, "epoch": 18.443396226415093, "percentage": 92.22, "elapsed_time": "1:00:44", "remaining_time": "0:05:07", "throughput": 5652.41, "total_tokens": 20601600} +{"current_steps": 31285, "total_steps": 33920, "loss": 0.2314, "lr": 1.8283909667062448e-07, "epoch": 18.44634433962264, "percentage": 92.23, "elapsed_time": "1:00:45", "remaining_time": "0:05:07", "throughput": 5652.56, "total_tokens": 20605376} +{"current_steps": 31290, "total_steps": 33920, "loss": 0.3108, "lr": 1.82150369728899e-07, "epoch": 18.44929245283019, "percentage": 92.25, "elapsed_time": "1:00:45", "remaining_time": "0:05:06", "throughput": 5652.72, "total_tokens": 20609440} +{"current_steps": 31295, "total_steps": 33920, "loss": 0.5015, "lr": 1.814629183336275e-07, "epoch": 18.452240566037737, "percentage": 92.26, "elapsed_time": "1:00:46", "remaining_time": "0:05:05", "throughput": 5652.73, "total_tokens": 20612672} +{"current_steps": 31300, "total_steps": 33920, "loss": 0.3402, "lr": 1.807767426668139e-07, "epoch": 18.455188679245282, "percentage": 92.28, "elapsed_time": "1:00:47", "remaining_time": "0:05:05", "throughput": 5652.75, "total_tokens": 20615744} +{"current_steps": 31305, "total_steps": 33920, "loss": 0.3054, "lr": 1.8009184291012783e-07, "epoch": 18.45813679245283, "percentage": 92.29, "elapsed_time": "1:00:47", "remaining_time": "0:05:04", "throughput": 5652.63, "total_tokens": 20618336} +{"current_steps": 31310, "total_steps": 33920, "loss": 0.2605, "lr": 1.7940821924489926e-07, "epoch": 18.46108490566038, "percentage": 92.31, "elapsed_time": "1:00:48", "remaining_time": "0:05:04", "throughput": 5652.61, "total_tokens": 20621472} +{"current_steps": 31315, "total_steps": 33920, "loss": 0.2885, "lr": 1.7872587185212009e-07, "epoch": 18.464033018867923, "percentage": 92.32, "elapsed_time": "1:00:48", "remaining_time": "0:05:03", "throughput": 5652.55, "total_tokens": 20624352} +{"current_steps": 31320, "total_steps": 33920, "loss": 0.1905, "lr": 1.7804480091244524e-07, "epoch": 18.46698113207547, "percentage": 92.33, "elapsed_time": "1:00:49", "remaining_time": "0:05:02", "throughput": 5652.54, "total_tokens": 20627136} +{"current_steps": 31325, "total_steps": 33920, "loss": 0.144, "lr": 1.7736500660619104e-07, "epoch": 18.46992924528302, "percentage": 92.35, "elapsed_time": "1:00:49", "remaining_time": "0:05:02", "throughput": 5652.69, "total_tokens": 20630976} +{"current_steps": 31330, "total_steps": 33920, "loss": 0.4279, "lr": 1.766864891133352e-07, "epoch": 18.472877358490567, "percentage": 92.36, "elapsed_time": "1:00:50", "remaining_time": "0:05:01", "throughput": 5652.59, "total_tokens": 20633568} +{"current_steps": 31335, "total_steps": 33920, "loss": 0.3558, "lr": 1.7600924861351843e-07, "epoch": 18.475825471698112, "percentage": 92.38, "elapsed_time": "1:00:50", "remaining_time": "0:05:01", "throughput": 5652.66, "total_tokens": 20636992} +{"current_steps": 31340, "total_steps": 33920, "loss": 0.2553, "lr": 1.7533328528604398e-07, "epoch": 18.47877358490566, "percentage": 92.39, "elapsed_time": "1:00:51", "remaining_time": "0:05:00", "throughput": 5652.62, "total_tokens": 20640032} +{"current_steps": 31345, "total_steps": 33920, "loss": 0.3101, "lr": 1.746585993098754e-07, "epoch": 18.48172169811321, "percentage": 92.41, "elapsed_time": "1:00:51", "remaining_time": "0:05:00", "throughput": 5652.49, "total_tokens": 20642688} +{"current_steps": 31350, "total_steps": 33920, "loss": 0.2545, "lr": 1.7398519086363864e-07, "epoch": 18.484669811320753, "percentage": 92.42, "elapsed_time": "1:00:52", "remaining_time": "0:04:59", "throughput": 5652.56, "total_tokens": 20646528} +{"current_steps": 31355, "total_steps": 33920, "loss": 0.3438, "lr": 1.733130601256211e-07, "epoch": 18.4876179245283, "percentage": 92.44, "elapsed_time": "1:00:53", "remaining_time": "0:04:58", "throughput": 5652.46, "total_tokens": 20649376} +{"current_steps": 31360, "total_steps": 33920, "loss": 0.3083, "lr": 1.7264220727377323e-07, "epoch": 18.49056603773585, "percentage": 92.45, "elapsed_time": "1:00:53", "remaining_time": "0:04:58", "throughput": 5652.41, "total_tokens": 20652448} +{"current_steps": 31365, "total_steps": 33920, "loss": 0.1776, "lr": 1.7197263248570517e-07, "epoch": 18.493514150943398, "percentage": 92.47, "elapsed_time": "1:00:54", "remaining_time": "0:04:57", "throughput": 5652.44, "total_tokens": 20655680} +{"current_steps": 31370, "total_steps": 33920, "loss": 0.2724, "lr": 1.7130433593869124e-07, "epoch": 18.496462264150942, "percentage": 92.48, "elapsed_time": "1:00:54", "remaining_time": "0:04:57", "throughput": 5652.44, "total_tokens": 20658592} +{"current_steps": 31375, "total_steps": 33920, "loss": 0.3661, "lr": 1.706373178096643e-07, "epoch": 18.49941037735849, "percentage": 92.5, "elapsed_time": "1:00:55", "remaining_time": "0:04:56", "throughput": 5652.48, "total_tokens": 20661760} +{"current_steps": 31380, "total_steps": 33920, "loss": 0.3047, "lr": 1.6997157827522092e-07, "epoch": 18.50235849056604, "percentage": 92.51, "elapsed_time": "1:00:55", "remaining_time": "0:04:55", "throughput": 5652.47, "total_tokens": 20664928} +{"current_steps": 31385, "total_steps": 33920, "loss": 0.3332, "lr": 1.6930711751161843e-07, "epoch": 18.505306603773583, "percentage": 92.53, "elapsed_time": "1:00:56", "remaining_time": "0:04:55", "throughput": 5652.68, "total_tokens": 20669152} +{"current_steps": 31390, "total_steps": 33920, "loss": 0.4271, "lr": 1.6864393569477556e-07, "epoch": 18.50825471698113, "percentage": 92.54, "elapsed_time": "1:00:57", "remaining_time": "0:04:54", "throughput": 5652.72, "total_tokens": 20672448} +{"current_steps": 31395, "total_steps": 33920, "loss": 0.2415, "lr": 1.6798203300027295e-07, "epoch": 18.51120283018868, "percentage": 92.56, "elapsed_time": "1:00:57", "remaining_time": "0:04:54", "throughput": 5652.68, "total_tokens": 20675296} +{"current_steps": 31400, "total_steps": 33920, "loss": 0.1918, "lr": 1.6732140960335152e-07, "epoch": 18.514150943396228, "percentage": 92.57, "elapsed_time": "1:00:58", "remaining_time": "0:04:53", "throughput": 5652.65, "total_tokens": 20678368} +{"current_steps": 31405, "total_steps": 33920, "loss": 0.219, "lr": 1.666620656789153e-07, "epoch": 18.517099056603772, "percentage": 92.59, "elapsed_time": "1:00:58", "remaining_time": "0:04:53", "throughput": 5652.54, "total_tokens": 20681088} +{"current_steps": 31410, "total_steps": 33920, "loss": 0.3178, "lr": 1.660040014015274e-07, "epoch": 18.52004716981132, "percentage": 92.6, "elapsed_time": "1:00:59", "remaining_time": "0:04:52", "throughput": 5652.59, "total_tokens": 20684800} +{"current_steps": 31415, "total_steps": 33920, "loss": 0.3978, "lr": 1.6534721694541344e-07, "epoch": 18.52299528301887, "percentage": 92.61, "elapsed_time": "1:00:59", "remaining_time": "0:04:51", "throughput": 5652.68, "total_tokens": 20688384} +{"current_steps": 31420, "total_steps": 33920, "loss": 0.2508, "lr": 1.6469171248445993e-07, "epoch": 18.525943396226417, "percentage": 92.63, "elapsed_time": "1:01:00", "remaining_time": "0:04:51", "throughput": 5652.69, "total_tokens": 20691456} +{"current_steps": 31425, "total_steps": 33920, "loss": 0.2799, "lr": 1.6403748819221464e-07, "epoch": 18.52889150943396, "percentage": 92.64, "elapsed_time": "1:01:01", "remaining_time": "0:04:50", "throughput": 5652.73, "total_tokens": 20694912} +{"current_steps": 31430, "total_steps": 33920, "loss": 0.3064, "lr": 1.6338454424188632e-07, "epoch": 18.53183962264151, "percentage": 92.66, "elapsed_time": "1:01:01", "remaining_time": "0:04:50", "throughput": 5652.74, "total_tokens": 20698848} +{"current_steps": 31435, "total_steps": 33920, "loss": 0.3453, "lr": 1.6273288080634442e-07, "epoch": 18.534787735849058, "percentage": 92.67, "elapsed_time": "1:01:02", "remaining_time": "0:04:49", "throughput": 5652.91, "total_tokens": 20702816} +{"current_steps": 31440, "total_steps": 33920, "loss": 0.3503, "lr": 1.6208249805811982e-07, "epoch": 18.537735849056602, "percentage": 92.69, "elapsed_time": "1:01:02", "remaining_time": "0:04:48", "throughput": 5653.05, "total_tokens": 20706720} +{"current_steps": 31445, "total_steps": 33920, "loss": 0.3267, "lr": 1.6143339616940423e-07, "epoch": 18.54068396226415, "percentage": 92.7, "elapsed_time": "1:01:03", "remaining_time": "0:04:48", "throughput": 5652.95, "total_tokens": 20709376} +{"current_steps": 31450, "total_steps": 33920, "loss": 0.3574, "lr": 1.6078557531205018e-07, "epoch": 18.5436320754717, "percentage": 92.72, "elapsed_time": "1:01:04", "remaining_time": "0:04:47", "throughput": 5653.01, "total_tokens": 20713216} +{"current_steps": 31455, "total_steps": 33920, "loss": 0.2175, "lr": 1.601390356575705e-07, "epoch": 18.546580188679247, "percentage": 92.73, "elapsed_time": "1:01:04", "remaining_time": "0:04:47", "throughput": 5652.89, "total_tokens": 20715936} +{"current_steps": 31460, "total_steps": 33920, "loss": 0.2481, "lr": 1.5949377737713988e-07, "epoch": 18.54952830188679, "percentage": 92.75, "elapsed_time": "1:01:05", "remaining_time": "0:04:46", "throughput": 5652.91, "total_tokens": 20719296} +{"current_steps": 31465, "total_steps": 33920, "loss": 0.3427, "lr": 1.5884980064159338e-07, "epoch": 18.55247641509434, "percentage": 92.76, "elapsed_time": "1:01:05", "remaining_time": "0:04:46", "throughput": 5652.86, "total_tokens": 20722144} +{"current_steps": 31470, "total_steps": 33920, "loss": 0.3431, "lr": 1.5820710562142627e-07, "epoch": 18.555424528301888, "percentage": 92.78, "elapsed_time": "1:01:06", "remaining_time": "0:04:45", "throughput": 5652.93, "total_tokens": 20725568} +{"current_steps": 31475, "total_steps": 33920, "loss": 0.372, "lr": 1.575656924867952e-07, "epoch": 18.558372641509433, "percentage": 92.79, "elapsed_time": "1:01:06", "remaining_time": "0:04:44", "throughput": 5652.92, "total_tokens": 20728480} +{"current_steps": 31480, "total_steps": 33920, "loss": 0.2229, "lr": 1.5692556140751658e-07, "epoch": 18.56132075471698, "percentage": 92.81, "elapsed_time": "1:01:07", "remaining_time": "0:04:44", "throughput": 5652.97, "total_tokens": 20733504} +{"current_steps": 31485, "total_steps": 33920, "loss": 0.1943, "lr": 1.5628671255306706e-07, "epoch": 18.56426886792453, "percentage": 92.82, "elapsed_time": "1:01:08", "remaining_time": "0:04:43", "throughput": 5653.15, "total_tokens": 20738848} +{"current_steps": 31490, "total_steps": 33920, "loss": 0.2849, "lr": 1.556491460925863e-07, "epoch": 18.567216981132077, "percentage": 92.84, "elapsed_time": "1:01:09", "remaining_time": "0:04:43", "throughput": 5653.16, "total_tokens": 20742080} +{"current_steps": 31495, "total_steps": 33920, "loss": 0.3311, "lr": 1.550128621948721e-07, "epoch": 18.57016509433962, "percentage": 92.85, "elapsed_time": "1:01:09", "remaining_time": "0:04:42", "throughput": 5653.05, "total_tokens": 20744832} +{"current_steps": 31500, "total_steps": 33920, "loss": 0.2841, "lr": 1.5437786102838413e-07, "epoch": 18.57311320754717, "percentage": 92.87, "elapsed_time": "1:01:10", "remaining_time": "0:04:41", "throughput": 5653.04, "total_tokens": 20748064} +{"current_steps": 31505, "total_steps": 33920, "loss": 0.2131, "lr": 1.5374414276124017e-07, "epoch": 18.576061320754718, "percentage": 92.88, "elapsed_time": "1:01:10", "remaining_time": "0:04:41", "throughput": 5653.05, "total_tokens": 20751136} +{"current_steps": 31510, "total_steps": 33920, "loss": 0.2703, "lr": 1.5311170756122095e-07, "epoch": 18.579009433962263, "percentage": 92.9, "elapsed_time": "1:01:11", "remaining_time": "0:04:40", "throughput": 5653.18, "total_tokens": 20755072} +{"current_steps": 31515, "total_steps": 33920, "loss": 0.2238, "lr": 1.5248055559576647e-07, "epoch": 18.58195754716981, "percentage": 92.91, "elapsed_time": "1:01:11", "remaining_time": "0:04:40", "throughput": 5653.09, "total_tokens": 20757728} +{"current_steps": 31520, "total_steps": 33920, "loss": 0.2602, "lr": 1.5185068703197526e-07, "epoch": 18.58490566037736, "percentage": 92.92, "elapsed_time": "1:01:12", "remaining_time": "0:04:39", "throughput": 5653.08, "total_tokens": 20760960} +{"current_steps": 31525, "total_steps": 33920, "loss": 0.3476, "lr": 1.5122210203661004e-07, "epoch": 18.587853773584907, "percentage": 92.94, "elapsed_time": "1:01:13", "remaining_time": "0:04:39", "throughput": 5653.07, "total_tokens": 20763968} +{"current_steps": 31530, "total_steps": 33920, "loss": 0.3324, "lr": 1.505948007760899e-07, "epoch": 18.590801886792452, "percentage": 92.95, "elapsed_time": "1:01:13", "remaining_time": "0:04:38", "throughput": 5653.12, "total_tokens": 20767296} +{"current_steps": 31535, "total_steps": 33920, "loss": 0.2508, "lr": 1.4996878341649647e-07, "epoch": 18.59375, "percentage": 92.97, "elapsed_time": "1:01:14", "remaining_time": "0:04:37", "throughput": 5653.11, "total_tokens": 20770304} +{"current_steps": 31540, "total_steps": 33920, "loss": 0.2714, "lr": 1.493440501235699e-07, "epoch": 18.596698113207548, "percentage": 92.98, "elapsed_time": "1:01:14", "remaining_time": "0:04:37", "throughput": 5653.2, "total_tokens": 20774144} +{"current_steps": 31545, "total_steps": 33920, "loss": 0.3096, "lr": 1.487206010627118e-07, "epoch": 18.599646226415093, "percentage": 93.0, "elapsed_time": "1:01:15", "remaining_time": "0:04:36", "throughput": 5653.11, "total_tokens": 20776704} +{"current_steps": 31550, "total_steps": 33920, "loss": 0.1854, "lr": 1.4809843639898124e-07, "epoch": 18.60259433962264, "percentage": 93.01, "elapsed_time": "1:01:15", "remaining_time": "0:04:36", "throughput": 5652.89, "total_tokens": 20778816} +{"current_steps": 31555, "total_steps": 33920, "loss": 0.2772, "lr": 1.4747755629710093e-07, "epoch": 18.60554245283019, "percentage": 93.03, "elapsed_time": "1:01:16", "remaining_time": "0:04:35", "throughput": 5652.81, "total_tokens": 20782144} +{"current_steps": 31560, "total_steps": 33920, "loss": 0.2522, "lr": 1.4685796092145045e-07, "epoch": 18.608490566037737, "percentage": 93.04, "elapsed_time": "1:01:17", "remaining_time": "0:04:34", "throughput": 5652.89, "total_tokens": 20785824} +{"current_steps": 31565, "total_steps": 33920, "loss": 0.1991, "lr": 1.4623965043607135e-07, "epoch": 18.611438679245282, "percentage": 93.06, "elapsed_time": "1:01:17", "remaining_time": "0:04:34", "throughput": 5652.8, "total_tokens": 20788512} +{"current_steps": 31570, "total_steps": 33920, "loss": 0.2738, "lr": 1.4562262500466273e-07, "epoch": 18.61438679245283, "percentage": 93.07, "elapsed_time": "1:01:18", "remaining_time": "0:04:33", "throughput": 5652.7, "total_tokens": 20791072} +{"current_steps": 31575, "total_steps": 33920, "loss": 0.3125, "lr": 1.4500688479058556e-07, "epoch": 18.61733490566038, "percentage": 93.09, "elapsed_time": "1:01:18", "remaining_time": "0:04:33", "throughput": 5652.7, "total_tokens": 20794112} +{"current_steps": 31580, "total_steps": 33920, "loss": 0.3096, "lr": 1.4439242995685943e-07, "epoch": 18.620283018867923, "percentage": 93.1, "elapsed_time": "1:01:19", "remaining_time": "0:04:32", "throughput": 5652.7, "total_tokens": 20797600} +{"current_steps": 31585, "total_steps": 33920, "loss": 0.3893, "lr": 1.4377926066616364e-07, "epoch": 18.62323113207547, "percentage": 93.12, "elapsed_time": "1:01:19", "remaining_time": "0:04:32", "throughput": 5652.72, "total_tokens": 20800640} +{"current_steps": 31590, "total_steps": 33920, "loss": 0.238, "lr": 1.4316737708083783e-07, "epoch": 18.62617924528302, "percentage": 93.13, "elapsed_time": "1:01:20", "remaining_time": "0:04:31", "throughput": 5652.79, "total_tokens": 20804384} +{"current_steps": 31595, "total_steps": 33920, "loss": 0.3017, "lr": 1.4255677936288127e-07, "epoch": 18.629127358490567, "percentage": 93.15, "elapsed_time": "1:01:20", "remaining_time": "0:04:30", "throughput": 5652.78, "total_tokens": 20807456} +{"current_steps": 31600, "total_steps": 33920, "loss": 0.3664, "lr": 1.4194746767395184e-07, "epoch": 18.632075471698112, "percentage": 93.16, "elapsed_time": "1:01:21", "remaining_time": "0:04:30", "throughput": 5652.7, "total_tokens": 20810176} +{"current_steps": 31605, "total_steps": 33920, "loss": 0.2649, "lr": 1.4133944217536722e-07, "epoch": 18.63502358490566, "percentage": 93.18, "elapsed_time": "1:01:22", "remaining_time": "0:04:29", "throughput": 5652.63, "total_tokens": 20812992} +{"current_steps": 31610, "total_steps": 33920, "loss": 0.2098, "lr": 1.4073270302810471e-07, "epoch": 18.63797169811321, "percentage": 93.19, "elapsed_time": "1:01:22", "remaining_time": "0:04:29", "throughput": 5652.71, "total_tokens": 20816576} +{"current_steps": 31615, "total_steps": 33920, "loss": 0.2744, "lr": 1.4012725039280084e-07, "epoch": 18.640919811320753, "percentage": 93.2, "elapsed_time": "1:01:23", "remaining_time": "0:04:28", "throughput": 5652.74, "total_tokens": 20819808} +{"current_steps": 31620, "total_steps": 33920, "loss": 0.2978, "lr": 1.3952308442975292e-07, "epoch": 18.6438679245283, "percentage": 93.22, "elapsed_time": "1:01:23", "remaining_time": "0:04:27", "throughput": 5652.87, "total_tokens": 20823552} +{"current_steps": 31625, "total_steps": 33920, "loss": 0.2867, "lr": 1.3892020529891637e-07, "epoch": 18.64681603773585, "percentage": 93.23, "elapsed_time": "1:01:24", "remaining_time": "0:04:27", "throughput": 5652.89, "total_tokens": 20826880} +{"current_steps": 31630, "total_steps": 33920, "loss": 0.3328, "lr": 1.3831861315990514e-07, "epoch": 18.649764150943398, "percentage": 93.25, "elapsed_time": "1:01:24", "remaining_time": "0:04:26", "throughput": 5652.69, "total_tokens": 20829184} +{"current_steps": 31635, "total_steps": 33920, "loss": 0.2415, "lr": 1.377183081719935e-07, "epoch": 18.652712264150942, "percentage": 93.26, "elapsed_time": "1:01:25", "remaining_time": "0:04:26", "throughput": 5652.61, "total_tokens": 20831808} +{"current_steps": 31640, "total_steps": 33920, "loss": 0.2325, "lr": 1.3711929049411544e-07, "epoch": 18.65566037735849, "percentage": 93.28, "elapsed_time": "1:01:25", "remaining_time": "0:04:25", "throughput": 5652.66, "total_tokens": 20835328} +{"current_steps": 31645, "total_steps": 33920, "loss": 0.2208, "lr": 1.365215602848624e-07, "epoch": 18.65860849056604, "percentage": 93.29, "elapsed_time": "1:01:26", "remaining_time": "0:04:25", "throughput": 5652.67, "total_tokens": 20838464} +{"current_steps": 31650, "total_steps": 33920, "loss": 0.2708, "lr": 1.3592511770248727e-07, "epoch": 18.661556603773583, "percentage": 93.31, "elapsed_time": "1:01:26", "remaining_time": "0:04:24", "throughput": 5652.7, "total_tokens": 20841472} +{"current_steps": 31655, "total_steps": 33920, "loss": 0.3102, "lr": 1.3532996290490041e-07, "epoch": 18.66450471698113, "percentage": 93.32, "elapsed_time": "1:01:27", "remaining_time": "0:04:23", "throughput": 5652.59, "total_tokens": 20844128} +{"current_steps": 31660, "total_steps": 33920, "loss": 0.313, "lr": 1.347360960496713e-07, "epoch": 18.66745283018868, "percentage": 93.34, "elapsed_time": "1:01:28", "remaining_time": "0:04:23", "throughput": 5652.59, "total_tokens": 20847424} +{"current_steps": 31665, "total_steps": 33920, "loss": 0.2812, "lr": 1.3414351729402862e-07, "epoch": 18.670400943396228, "percentage": 93.35, "elapsed_time": "1:01:28", "remaining_time": "0:04:22", "throughput": 5652.73, "total_tokens": 20851616} +{"current_steps": 31670, "total_steps": 33920, "loss": 0.3361, "lr": 1.3355222679486025e-07, "epoch": 18.673349056603772, "percentage": 93.37, "elapsed_time": "1:01:29", "remaining_time": "0:04:22", "throughput": 5652.74, "total_tokens": 20854880} +{"current_steps": 31675, "total_steps": 33920, "loss": 0.3138, "lr": 1.3296222470871367e-07, "epoch": 18.67629716981132, "percentage": 93.38, "elapsed_time": "1:01:29", "remaining_time": "0:04:21", "throughput": 5652.75, "total_tokens": 20857888} +{"current_steps": 31680, "total_steps": 33920, "loss": 0.2537, "lr": 1.3237351119179287e-07, "epoch": 18.67924528301887, "percentage": 93.4, "elapsed_time": "1:01:30", "remaining_time": "0:04:20", "throughput": 5652.85, "total_tokens": 20861536} +{"current_steps": 31685, "total_steps": 33920, "loss": 0.2684, "lr": 1.3178608639996425e-07, "epoch": 18.682193396226417, "percentage": 93.41, "elapsed_time": "1:01:30", "remaining_time": "0:04:20", "throughput": 5652.96, "total_tokens": 20865024} +{"current_steps": 31690, "total_steps": 33920, "loss": 0.2398, "lr": 1.3119995048874957e-07, "epoch": 18.68514150943396, "percentage": 93.43, "elapsed_time": "1:01:31", "remaining_time": "0:04:19", "throughput": 5653.04, "total_tokens": 20868480} +{"current_steps": 31695, "total_steps": 33920, "loss": 0.2951, "lr": 1.3061510361333186e-07, "epoch": 18.68808962264151, "percentage": 93.44, "elapsed_time": "1:01:32", "remaining_time": "0:04:19", "throughput": 5652.97, "total_tokens": 20871200} +{"current_steps": 31700, "total_steps": 33920, "loss": 0.3776, "lr": 1.3003154592855116e-07, "epoch": 18.691037735849058, "percentage": 93.46, "elapsed_time": "1:01:32", "remaining_time": "0:04:18", "throughput": 5653.12, "total_tokens": 20875584} +{"current_steps": 31705, "total_steps": 33920, "loss": 0.3801, "lr": 1.2944927758890668e-07, "epoch": 18.693985849056602, "percentage": 93.47, "elapsed_time": "1:01:33", "remaining_time": "0:04:18", "throughput": 5653.04, "total_tokens": 20878368} +{"current_steps": 31710, "total_steps": 33920, "loss": 0.3346, "lr": 1.2886829874855733e-07, "epoch": 18.69693396226415, "percentage": 93.48, "elapsed_time": "1:01:33", "remaining_time": "0:04:17", "throughput": 5652.97, "total_tokens": 20881056} +{"current_steps": 31715, "total_steps": 33920, "loss": 0.3651, "lr": 1.2828860956131894e-07, "epoch": 18.6998820754717, "percentage": 93.5, "elapsed_time": "1:01:34", "remaining_time": "0:04:16", "throughput": 5652.85, "total_tokens": 20883552} +{"current_steps": 31720, "total_steps": 33920, "loss": 0.4373, "lr": 1.2771021018066765e-07, "epoch": 18.702830188679247, "percentage": 93.51, "elapsed_time": "1:01:34", "remaining_time": "0:04:16", "throughput": 5653.01, "total_tokens": 20887328} +{"current_steps": 31725, "total_steps": 33920, "loss": 0.3102, "lr": 1.271331007597365e-07, "epoch": 18.70577830188679, "percentage": 93.53, "elapsed_time": "1:01:35", "remaining_time": "0:04:15", "throughput": 5652.88, "total_tokens": 20889984} +{"current_steps": 31730, "total_steps": 33920, "loss": 0.3166, "lr": 1.2655728145131774e-07, "epoch": 18.70872641509434, "percentage": 93.54, "elapsed_time": "1:01:36", "remaining_time": "0:04:15", "throughput": 5652.82, "total_tokens": 20892864} +{"current_steps": 31735, "total_steps": 33920, "loss": 0.3619, "lr": 1.2598275240786105e-07, "epoch": 18.711674528301888, "percentage": 93.56, "elapsed_time": "1:01:36", "remaining_time": "0:04:14", "throughput": 5652.96, "total_tokens": 20896704} +{"current_steps": 31740, "total_steps": 33920, "loss": 0.2886, "lr": 1.254095137814776e-07, "epoch": 18.714622641509433, "percentage": 93.57, "elapsed_time": "1:01:37", "remaining_time": "0:04:13", "throughput": 5653.03, "total_tokens": 20900320} +{"current_steps": 31745, "total_steps": 33920, "loss": 0.318, "lr": 1.2483756572393368e-07, "epoch": 18.71757075471698, "percentage": 93.59, "elapsed_time": "1:01:37", "remaining_time": "0:04:13", "throughput": 5653.27, "total_tokens": 20905184} +{"current_steps": 31750, "total_steps": 33920, "loss": 0.3058, "lr": 1.242669083866549e-07, "epoch": 18.72051886792453, "percentage": 93.6, "elapsed_time": "1:01:38", "remaining_time": "0:04:12", "throughput": 5653.25, "total_tokens": 20908320} +{"current_steps": 31755, "total_steps": 33920, "loss": 0.3514, "lr": 1.2369754192072537e-07, "epoch": 18.723466981132077, "percentage": 93.62, "elapsed_time": "1:01:38", "remaining_time": "0:04:12", "throughput": 5653.07, "total_tokens": 20910624} +{"current_steps": 31760, "total_steps": 33920, "loss": 0.2971, "lr": 1.231294664768873e-07, "epoch": 18.72641509433962, "percentage": 93.63, "elapsed_time": "1:01:39", "remaining_time": "0:04:11", "throughput": 5653.11, "total_tokens": 20914016} +{"current_steps": 31765, "total_steps": 33920, "loss": 0.4624, "lr": 1.225626822055409e-07, "epoch": 18.72936320754717, "percentage": 93.65, "elapsed_time": "1:01:40", "remaining_time": "0:04:11", "throughput": 5653.13, "total_tokens": 20917088} +{"current_steps": 31770, "total_steps": 33920, "loss": 0.2951, "lr": 1.2199718925674508e-07, "epoch": 18.732311320754718, "percentage": 93.66, "elapsed_time": "1:01:40", "remaining_time": "0:04:10", "throughput": 5653.14, "total_tokens": 20920192} +{"current_steps": 31775, "total_steps": 33920, "loss": 0.3457, "lr": 1.2143298778021616e-07, "epoch": 18.735259433962263, "percentage": 93.68, "elapsed_time": "1:01:41", "remaining_time": "0:04:09", "throughput": 5653.07, "total_tokens": 20922912} +{"current_steps": 31780, "total_steps": 33920, "loss": 0.2978, "lr": 1.2087007792532967e-07, "epoch": 18.73820754716981, "percentage": 93.69, "elapsed_time": "1:01:41", "remaining_time": "0:04:09", "throughput": 5653.15, "total_tokens": 20926912} +{"current_steps": 31785, "total_steps": 33920, "loss": 0.4046, "lr": 1.203084598411175e-07, "epoch": 18.74115566037736, "percentage": 93.71, "elapsed_time": "1:01:42", "remaining_time": "0:04:08", "throughput": 5653.21, "total_tokens": 20930112} +{"current_steps": 31790, "total_steps": 33920, "loss": 0.2565, "lr": 1.1974813367627124e-07, "epoch": 18.744103773584907, "percentage": 93.72, "elapsed_time": "1:01:42", "remaining_time": "0:04:08", "throughput": 5653.3, "total_tokens": 20933984} +{"current_steps": 31795, "total_steps": 33920, "loss": 0.3247, "lr": 1.1918909957913949e-07, "epoch": 18.747051886792452, "percentage": 93.74, "elapsed_time": "1:01:43", "remaining_time": "0:04:07", "throughput": 5653.19, "total_tokens": 20936512} +{"current_steps": 31800, "total_steps": 33920, "loss": 0.3118, "lr": 1.1863135769772827e-07, "epoch": 18.75, "percentage": 93.75, "elapsed_time": "1:01:44", "remaining_time": "0:04:06", "throughput": 5653.1, "total_tokens": 20939072} +{"current_steps": 31805, "total_steps": 33920, "loss": 0.2144, "lr": 1.1807490817970279e-07, "epoch": 18.752948113207548, "percentage": 93.76, "elapsed_time": "1:01:44", "remaining_time": "0:04:06", "throughput": 5653.16, "total_tokens": 20942784} +{"current_steps": 31810, "total_steps": 33920, "loss": 0.4106, "lr": 1.1751975117238578e-07, "epoch": 18.755896226415093, "percentage": 93.78, "elapsed_time": "1:01:45", "remaining_time": "0:04:05", "throughput": 5653.13, "total_tokens": 20945696} +{"current_steps": 31815, "total_steps": 33920, "loss": 0.3534, "lr": 1.1696588682275633e-07, "epoch": 18.75884433962264, "percentage": 93.79, "elapsed_time": "1:01:45", "remaining_time": "0:04:05", "throughput": 5653.15, "total_tokens": 20949152} +{"current_steps": 31820, "total_steps": 33920, "loss": 0.418, "lr": 1.1641331527745325e-07, "epoch": 18.76179245283019, "percentage": 93.81, "elapsed_time": "1:01:46", "remaining_time": "0:04:04", "throughput": 5653.11, "total_tokens": 20952064} +{"current_steps": 31825, "total_steps": 33920, "loss": 0.2496, "lr": 1.1586203668277229e-07, "epoch": 18.764740566037737, "percentage": 93.82, "elapsed_time": "1:01:46", "remaining_time": "0:04:04", "throughput": 5652.99, "total_tokens": 20954752} +{"current_steps": 31830, "total_steps": 33920, "loss": 0.1909, "lr": 1.1531205118466615e-07, "epoch": 18.767688679245282, "percentage": 93.84, "elapsed_time": "1:01:47", "remaining_time": "0:04:03", "throughput": 5652.95, "total_tokens": 20957568} +{"current_steps": 31835, "total_steps": 33920, "loss": 0.3017, "lr": 1.1476335892874669e-07, "epoch": 18.77063679245283, "percentage": 93.85, "elapsed_time": "1:01:47", "remaining_time": "0:04:02", "throughput": 5652.88, "total_tokens": 20960640} +{"current_steps": 31840, "total_steps": 33920, "loss": 0.3018, "lr": 1.1421596006028157e-07, "epoch": 18.77358490566038, "percentage": 93.87, "elapsed_time": "1:01:48", "remaining_time": "0:04:02", "throughput": 5652.77, "total_tokens": 20963296} +{"current_steps": 31845, "total_steps": 33920, "loss": 0.3012, "lr": 1.1366985472419823e-07, "epoch": 18.776533018867923, "percentage": 93.88, "elapsed_time": "1:01:49", "remaining_time": "0:04:01", "throughput": 5652.8, "total_tokens": 20966304} +{"current_steps": 31850, "total_steps": 33920, "loss": 0.2614, "lr": 1.1312504306507987e-07, "epoch": 18.77948113207547, "percentage": 93.9, "elapsed_time": "1:01:49", "remaining_time": "0:04:01", "throughput": 5652.9, "total_tokens": 20969920} +{"current_steps": 31855, "total_steps": 33920, "loss": 0.279, "lr": 1.1258152522716725e-07, "epoch": 18.78242924528302, "percentage": 93.91, "elapsed_time": "1:01:50", "remaining_time": "0:04:00", "throughput": 5652.82, "total_tokens": 20972576} +{"current_steps": 31860, "total_steps": 33920, "loss": 0.3219, "lr": 1.1203930135435914e-07, "epoch": 18.785377358490567, "percentage": 93.93, "elapsed_time": "1:01:50", "remaining_time": "0:03:59", "throughput": 5652.89, "total_tokens": 20976384} +{"current_steps": 31865, "total_steps": 33920, "loss": 0.3315, "lr": 1.1149837159021238e-07, "epoch": 18.788325471698112, "percentage": 93.94, "elapsed_time": "1:01:51", "remaining_time": "0:03:59", "throughput": 5653.01, "total_tokens": 20980640} +{"current_steps": 31870, "total_steps": 33920, "loss": 0.2896, "lr": 1.1095873607793961e-07, "epoch": 18.79127358490566, "percentage": 93.96, "elapsed_time": "1:01:51", "remaining_time": "0:03:58", "throughput": 5652.97, "total_tokens": 20983424} +{"current_steps": 31875, "total_steps": 33920, "loss": 0.3201, "lr": 1.1042039496041212e-07, "epoch": 18.79422169811321, "percentage": 93.97, "elapsed_time": "1:01:52", "remaining_time": "0:03:58", "throughput": 5652.97, "total_tokens": 20986336} +{"current_steps": 31880, "total_steps": 33920, "loss": 0.2905, "lr": 1.0988334838015812e-07, "epoch": 18.797169811320753, "percentage": 93.99, "elapsed_time": "1:01:52", "remaining_time": "0:03:57", "throughput": 5653.04, "total_tokens": 20989696} +{"current_steps": 31885, "total_steps": 33920, "loss": 0.3561, "lr": 1.0934759647936333e-07, "epoch": 18.8001179245283, "percentage": 94.0, "elapsed_time": "1:01:53", "remaining_time": "0:03:57", "throughput": 5653.05, "total_tokens": 20992736} +{"current_steps": 31890, "total_steps": 33920, "loss": 0.3549, "lr": 1.0881313939986926e-07, "epoch": 18.80306603773585, "percentage": 94.02, "elapsed_time": "1:01:54", "remaining_time": "0:03:56", "throughput": 5653.2, "total_tokens": 20996544} +{"current_steps": 31895, "total_steps": 33920, "loss": 0.3562, "lr": 1.0827997728317662e-07, "epoch": 18.806014150943398, "percentage": 94.03, "elapsed_time": "1:01:54", "remaining_time": "0:03:55", "throughput": 5653.38, "total_tokens": 21001152} +{"current_steps": 31900, "total_steps": 33920, "loss": 0.3298, "lr": 1.0774811027044196e-07, "epoch": 18.808962264150942, "percentage": 94.04, "elapsed_time": "1:01:55", "remaining_time": "0:03:55", "throughput": 5653.31, "total_tokens": 21003840} +{"current_steps": 31905, "total_steps": 33920, "loss": 0.3496, "lr": 1.0721753850247984e-07, "epoch": 18.81191037735849, "percentage": 94.06, "elapsed_time": "1:01:55", "remaining_time": "0:03:54", "throughput": 5653.27, "total_tokens": 21007168} +{"current_steps": 31910, "total_steps": 33920, "loss": 0.2527, "lr": 1.0668826211976124e-07, "epoch": 18.81485849056604, "percentage": 94.07, "elapsed_time": "1:01:56", "remaining_time": "0:03:54", "throughput": 5653.26, "total_tokens": 21010112} +{"current_steps": 31915, "total_steps": 33920, "loss": 0.3332, "lr": 1.0616028126241407e-07, "epoch": 18.817806603773583, "percentage": 94.09, "elapsed_time": "1:01:56", "remaining_time": "0:03:53", "throughput": 5653.21, "total_tokens": 21012896} +{"current_steps": 31920, "total_steps": 33920, "loss": 0.3161, "lr": 1.0563359607022372e-07, "epoch": 18.82075471698113, "percentage": 94.1, "elapsed_time": "1:01:57", "remaining_time": "0:03:52", "throughput": 5653.2, "total_tokens": 21015840} +{"current_steps": 31925, "total_steps": 33920, "loss": 0.3291, "lr": 1.05108206682632e-07, "epoch": 18.82370283018868, "percentage": 94.12, "elapsed_time": "1:01:58", "remaining_time": "0:03:52", "throughput": 5653.13, "total_tokens": 21018496} +{"current_steps": 31930, "total_steps": 33920, "loss": 0.416, "lr": 1.0458411323873874e-07, "epoch": 18.826650943396228, "percentage": 94.13, "elapsed_time": "1:01:58", "remaining_time": "0:03:51", "throughput": 5653.2, "total_tokens": 21022144} +{"current_steps": 31935, "total_steps": 33920, "loss": 0.3393, "lr": 1.0406131587729962e-07, "epoch": 18.829599056603772, "percentage": 94.15, "elapsed_time": "1:01:59", "remaining_time": "0:03:51", "throughput": 5653.19, "total_tokens": 21025408} +{"current_steps": 31940, "total_steps": 33920, "loss": 0.2728, "lr": 1.035398147367278e-07, "epoch": 18.83254716981132, "percentage": 94.16, "elapsed_time": "1:01:59", "remaining_time": "0:03:50", "throughput": 5653.23, "total_tokens": 21028864} +{"current_steps": 31945, "total_steps": 33920, "loss": 0.3146, "lr": 1.030196099550923e-07, "epoch": 18.83549528301887, "percentage": 94.18, "elapsed_time": "1:02:00", "remaining_time": "0:03:50", "throughput": 5653.23, "total_tokens": 21032032} +{"current_steps": 31950, "total_steps": 33920, "loss": 0.3748, "lr": 1.0250070167011905e-07, "epoch": 18.838443396226417, "percentage": 94.19, "elapsed_time": "1:02:00", "remaining_time": "0:03:49", "throughput": 5653.36, "total_tokens": 21035808} +{"current_steps": 31955, "total_steps": 33920, "loss": 0.3052, "lr": 1.0198309001919315e-07, "epoch": 18.84139150943396, "percentage": 94.21, "elapsed_time": "1:02:01", "remaining_time": "0:03:48", "throughput": 5653.43, "total_tokens": 21039616} +{"current_steps": 31960, "total_steps": 33920, "loss": 0.4245, "lr": 1.0146677513935277e-07, "epoch": 18.84433962264151, "percentage": 94.22, "elapsed_time": "1:02:02", "remaining_time": "0:03:48", "throughput": 5653.32, "total_tokens": 21042368} +{"current_steps": 31965, "total_steps": 33920, "loss": 0.2756, "lr": 1.0095175716729578e-07, "epoch": 18.847287735849058, "percentage": 94.24, "elapsed_time": "1:02:02", "remaining_time": "0:03:47", "throughput": 5653.41, "total_tokens": 21045984} +{"current_steps": 31970, "total_steps": 33920, "loss": 0.3144, "lr": 1.004380362393742e-07, "epoch": 18.850235849056602, "percentage": 94.25, "elapsed_time": "1:02:03", "remaining_time": "0:03:47", "throughput": 5653.38, "total_tokens": 21049056} +{"current_steps": 31975, "total_steps": 33920, "loss": 0.2716, "lr": 9.99256124915987e-08, "epoch": 18.85318396226415, "percentage": 94.27, "elapsed_time": "1:02:03", "remaining_time": "0:03:46", "throughput": 5653.26, "total_tokens": 21051712} +{"current_steps": 31980, "total_steps": 33920, "loss": 0.2737, "lr": 9.941448605963577e-08, "epoch": 18.8561320754717, "percentage": 94.28, "elapsed_time": "1:02:04", "remaining_time": "0:03:45", "throughput": 5653.16, "total_tokens": 21054336} +{"current_steps": 31985, "total_steps": 33920, "loss": 0.2659, "lr": 9.890465707880715e-08, "epoch": 18.859080188679247, "percentage": 94.3, "elapsed_time": "1:02:04", "remaining_time": "0:03:45", "throughput": 5653.19, "total_tokens": 21057536} +{"current_steps": 31990, "total_steps": 33920, "loss": 0.268, "lr": 9.839612568409374e-08, "epoch": 18.86202830188679, "percentage": 94.31, "elapsed_time": "1:02:05", "remaining_time": "0:03:44", "throughput": 5653.16, "total_tokens": 21060448} +{"current_steps": 31995, "total_steps": 33920, "loss": 0.2773, "lr": 9.788889201013119e-08, "epoch": 18.86497641509434, "percentage": 94.32, "elapsed_time": "1:02:06", "remaining_time": "0:03:44", "throughput": 5652.97, "total_tokens": 21062976} +{"current_steps": 32000, "total_steps": 33920, "loss": 0.1921, "lr": 9.738295619121097e-08, "epoch": 18.867924528301888, "percentage": 94.34, "elapsed_time": "1:02:06", "remaining_time": "0:03:43", "throughput": 5652.93, "total_tokens": 21066144} +{"current_steps": 32005, "total_steps": 33920, "loss": 0.2307, "lr": 9.687831836128203e-08, "epoch": 18.870872641509433, "percentage": 94.35, "elapsed_time": "1:02:07", "remaining_time": "0:03:43", "throughput": 5652.92, "total_tokens": 21069440} +{"current_steps": 32010, "total_steps": 33920, "loss": 0.3318, "lr": 9.637497865395029e-08, "epoch": 18.87382075471698, "percentage": 94.37, "elapsed_time": "1:02:07", "remaining_time": "0:03:42", "throughput": 5653.08, "total_tokens": 21073536} +{"current_steps": 32015, "total_steps": 33920, "loss": 0.2782, "lr": 9.587293720247526e-08, "epoch": 18.87676886792453, "percentage": 94.38, "elapsed_time": "1:02:08", "remaining_time": "0:03:41", "throughput": 5653.09, "total_tokens": 21076672} +{"current_steps": 32020, "total_steps": 33920, "loss": 0.3116, "lr": 9.537219413977672e-08, "epoch": 18.879716981132077, "percentage": 94.4, "elapsed_time": "1:02:08", "remaining_time": "0:03:41", "throughput": 5653.26, "total_tokens": 21080672} +{"current_steps": 32025, "total_steps": 33920, "loss": 0.2796, "lr": 9.487274959842696e-08, "epoch": 18.88266509433962, "percentage": 94.41, "elapsed_time": "1:02:09", "remaining_time": "0:03:40", "throughput": 5653.33, "total_tokens": 21084384} +{"current_steps": 32030, "total_steps": 33920, "loss": 0.3324, "lr": 9.437460371065687e-08, "epoch": 18.88561320754717, "percentage": 94.43, "elapsed_time": "1:02:10", "remaining_time": "0:03:40", "throughput": 5653.24, "total_tokens": 21087200} +{"current_steps": 32035, "total_steps": 33920, "loss": 0.2136, "lr": 9.387775660835263e-08, "epoch": 18.888561320754718, "percentage": 94.44, "elapsed_time": "1:02:10", "remaining_time": "0:03:39", "throughput": 5653.33, "total_tokens": 21090560} +{"current_steps": 32040, "total_steps": 33920, "loss": 0.2969, "lr": 9.338220842305678e-08, "epoch": 18.891509433962263, "percentage": 94.46, "elapsed_time": "1:02:11", "remaining_time": "0:03:38", "throughput": 5653.37, "total_tokens": 21093728} +{"current_steps": 32045, "total_steps": 33920, "loss": 0.3623, "lr": 9.288795928596661e-08, "epoch": 18.89445754716981, "percentage": 94.47, "elapsed_time": "1:02:11", "remaining_time": "0:03:38", "throughput": 5653.47, "total_tokens": 21097472} +{"current_steps": 32050, "total_steps": 33920, "loss": 0.3069, "lr": 9.239500932793854e-08, "epoch": 18.89740566037736, "percentage": 94.49, "elapsed_time": "1:02:12", "remaining_time": "0:03:37", "throughput": 5653.67, "total_tokens": 21101920} +{"current_steps": 32055, "total_steps": 33920, "loss": 0.3185, "lr": 9.190335867948263e-08, "epoch": 18.900353773584907, "percentage": 94.5, "elapsed_time": "1:02:12", "remaining_time": "0:03:37", "throughput": 5653.57, "total_tokens": 21104672} +{"current_steps": 32060, "total_steps": 33920, "loss": 0.271, "lr": 9.141300747076476e-08, "epoch": 18.903301886792452, "percentage": 94.52, "elapsed_time": "1:02:13", "remaining_time": "0:03:36", "throughput": 5653.37, "total_tokens": 21106944} +{"current_steps": 32065, "total_steps": 33920, "loss": 0.2833, "lr": 9.092395583160773e-08, "epoch": 18.90625, "percentage": 94.53, "elapsed_time": "1:02:14", "remaining_time": "0:03:36", "throughput": 5653.26, "total_tokens": 21109600} +{"current_steps": 32070, "total_steps": 33920, "loss": 0.3279, "lr": 9.043620389149021e-08, "epoch": 18.909198113207548, "percentage": 94.55, "elapsed_time": "1:02:14", "remaining_time": "0:03:35", "throughput": 5653.26, "total_tokens": 21112960} +{"current_steps": 32075, "total_steps": 33920, "loss": 0.3178, "lr": 8.994975177954723e-08, "epoch": 18.912146226415093, "percentage": 94.56, "elapsed_time": "1:02:15", "remaining_time": "0:03:34", "throughput": 5653.21, "total_tokens": 21115776} +{"current_steps": 32080, "total_steps": 33920, "loss": 0.3191, "lr": 8.946459962456855e-08, "epoch": 18.91509433962264, "percentage": 94.58, "elapsed_time": "1:02:15", "remaining_time": "0:03:34", "throughput": 5653.27, "total_tokens": 21119296} +{"current_steps": 32085, "total_steps": 33920, "loss": 0.2418, "lr": 8.89807475550003e-08, "epoch": 18.91804245283019, "percentage": 94.59, "elapsed_time": "1:02:16", "remaining_time": "0:03:33", "throughput": 5653.21, "total_tokens": 21122208} +{"current_steps": 32090, "total_steps": 33920, "loss": 0.3162, "lr": 8.849819569894447e-08, "epoch": 18.920990566037737, "percentage": 94.6, "elapsed_time": "1:02:16", "remaining_time": "0:03:33", "throughput": 5653.16, "total_tokens": 21125248} +{"current_steps": 32095, "total_steps": 33920, "loss": 0.2741, "lr": 8.801694418415884e-08, "epoch": 18.923938679245282, "percentage": 94.62, "elapsed_time": "1:02:17", "remaining_time": "0:03:32", "throughput": 5653.17, "total_tokens": 21128192} +{"current_steps": 32100, "total_steps": 33920, "loss": 0.4065, "lr": 8.753699313805708e-08, "epoch": 18.92688679245283, "percentage": 94.63, "elapsed_time": "1:02:17", "remaining_time": "0:03:31", "throughput": 5653.14, "total_tokens": 21131200} +{"current_steps": 32105, "total_steps": 33920, "loss": 0.3387, "lr": 8.705834268770753e-08, "epoch": 18.92983490566038, "percentage": 94.65, "elapsed_time": "1:02:18", "remaining_time": "0:03:31", "throughput": 5653.08, "total_tokens": 21134144} +{"current_steps": 32110, "total_steps": 33920, "loss": 0.389, "lr": 8.65809929598349e-08, "epoch": 18.932783018867923, "percentage": 94.66, "elapsed_time": "1:02:19", "remaining_time": "0:03:30", "throughput": 5653.1, "total_tokens": 21137344} +{"current_steps": 32115, "total_steps": 33920, "loss": 0.2981, "lr": 8.610494408082037e-08, "epoch": 18.93573113207547, "percentage": 94.68, "elapsed_time": "1:02:19", "remaining_time": "0:03:30", "throughput": 5653.07, "total_tokens": 21140512} +{"current_steps": 32120, "total_steps": 33920, "loss": 0.302, "lr": 8.563019617669977e-08, "epoch": 18.93867924528302, "percentage": 94.69, "elapsed_time": "1:02:20", "remaining_time": "0:03:29", "throughput": 5653.2, "total_tokens": 21144032} +{"current_steps": 32125, "total_steps": 33920, "loss": 0.4552, "lr": 8.51567493731642e-08, "epoch": 18.941627358490567, "percentage": 94.71, "elapsed_time": "1:02:20", "remaining_time": "0:03:29", "throughput": 5653.16, "total_tokens": 21146912} +{"current_steps": 32130, "total_steps": 33920, "loss": 0.2838, "lr": 8.468460379556176e-08, "epoch": 18.944575471698112, "percentage": 94.72, "elapsed_time": "1:02:21", "remaining_time": "0:03:28", "throughput": 5653.24, "total_tokens": 21150848} +{"current_steps": 32135, "total_steps": 33920, "loss": 0.3783, "lr": 8.421375956889355e-08, "epoch": 18.94752358490566, "percentage": 94.74, "elapsed_time": "1:02:22", "remaining_time": "0:03:27", "throughput": 5653.31, "total_tokens": 21154912} +{"current_steps": 32140, "total_steps": 33920, "loss": 0.2869, "lr": 8.374421681781819e-08, "epoch": 18.95047169811321, "percentage": 94.75, "elapsed_time": "1:02:22", "remaining_time": "0:03:27", "throughput": 5653.38, "total_tokens": 21159136} +{"current_steps": 32145, "total_steps": 33920, "loss": 0.4012, "lr": 8.327597566665013e-08, "epoch": 18.953419811320753, "percentage": 94.77, "elapsed_time": "1:02:23", "remaining_time": "0:03:26", "throughput": 5653.42, "total_tokens": 21162688} +{"current_steps": 32150, "total_steps": 33920, "loss": 0.283, "lr": 8.280903623935688e-08, "epoch": 18.9563679245283, "percentage": 94.78, "elapsed_time": "1:02:23", "remaining_time": "0:03:26", "throughput": 5653.48, "total_tokens": 21166400} +{"current_steps": 32155, "total_steps": 33920, "loss": 0.4112, "lr": 8.234339865956342e-08, "epoch": 18.95931603773585, "percentage": 94.8, "elapsed_time": "1:02:24", "remaining_time": "0:03:25", "throughput": 5653.58, "total_tokens": 21170880} +{"current_steps": 32160, "total_steps": 33920, "loss": 0.3218, "lr": 8.187906305054838e-08, "epoch": 18.962264150943398, "percentage": 94.81, "elapsed_time": "1:02:25", "remaining_time": "0:03:24", "throughput": 5653.58, "total_tokens": 21173856} +{"current_steps": 32165, "total_steps": 33920, "loss": 0.2773, "lr": 8.141602953524841e-08, "epoch": 18.965212264150942, "percentage": 94.83, "elapsed_time": "1:02:25", "remaining_time": "0:03:24", "throughput": 5653.53, "total_tokens": 21176896} +{"current_steps": 32170, "total_steps": 33920, "loss": 0.2673, "lr": 8.095429823625212e-08, "epoch": 18.96816037735849, "percentage": 94.84, "elapsed_time": "1:02:26", "remaining_time": "0:03:23", "throughput": 5653.65, "total_tokens": 21180576} +{"current_steps": 32175, "total_steps": 33920, "loss": 0.2532, "lr": 8.04938692758045e-08, "epoch": 18.97110849056604, "percentage": 94.86, "elapsed_time": "1:02:26", "remaining_time": "0:03:23", "throughput": 5653.72, "total_tokens": 21184160} +{"current_steps": 32180, "total_steps": 33920, "loss": 0.3168, "lr": 8.003474277580803e-08, "epoch": 18.974056603773583, "percentage": 94.87, "elapsed_time": "1:02:27", "remaining_time": "0:03:22", "throughput": 5653.78, "total_tokens": 21187584} +{"current_steps": 32185, "total_steps": 33920, "loss": 0.2607, "lr": 7.95769188578166e-08, "epoch": 18.97700471698113, "percentage": 94.89, "elapsed_time": "1:02:28", "remaining_time": "0:03:22", "throughput": 5653.73, "total_tokens": 21190592} +{"current_steps": 32190, "total_steps": 33920, "loss": 0.2441, "lr": 7.912039764304213e-08, "epoch": 18.97995283018868, "percentage": 94.9, "elapsed_time": "1:02:28", "remaining_time": "0:03:21", "throughput": 5653.68, "total_tokens": 21193472} +{"current_steps": 32195, "total_steps": 33920, "loss": 0.378, "lr": 7.866517925235017e-08, "epoch": 18.982900943396228, "percentage": 94.91, "elapsed_time": "1:02:29", "remaining_time": "0:03:20", "throughput": 5653.59, "total_tokens": 21196640} +{"current_steps": 32200, "total_steps": 33920, "loss": 0.388, "lr": 7.821126380626154e-08, "epoch": 18.985849056603772, "percentage": 94.93, "elapsed_time": "1:02:29", "remaining_time": "0:03:20", "throughput": 5653.47, "total_tokens": 21199168} +{"current_steps": 32205, "total_steps": 33920, "loss": 0.2318, "lr": 7.775865142495286e-08, "epoch": 18.98879716981132, "percentage": 94.94, "elapsed_time": "1:02:30", "remaining_time": "0:03:19", "throughput": 5653.47, "total_tokens": 21202592} +{"current_steps": 32210, "total_steps": 33920, "loss": 0.3996, "lr": 7.730734222825442e-08, "epoch": 18.99174528301887, "percentage": 94.96, "elapsed_time": "1:02:30", "remaining_time": "0:03:19", "throughput": 5653.51, "total_tokens": 21206176} +{"current_steps": 32215, "total_steps": 33920, "loss": 0.377, "lr": 7.68573363356534e-08, "epoch": 18.994693396226417, "percentage": 94.97, "elapsed_time": "1:02:31", "remaining_time": "0:03:18", "throughput": 5653.63, "total_tokens": 21209952} +{"current_steps": 32220, "total_steps": 33920, "loss": 0.3378, "lr": 7.640863386629005e-08, "epoch": 18.99764150943396, "percentage": 94.99, "elapsed_time": "1:02:32", "remaining_time": "0:03:17", "throughput": 5653.63, "total_tokens": 21212960} +{"current_steps": 32225, "total_steps": 33920, "loss": 0.2898, "lr": 7.59612349389599e-08, "epoch": 19.00058962264151, "percentage": 95.0, "elapsed_time": "1:02:33", "remaining_time": "0:03:17", "throughput": 5652.81, "total_tokens": 21215152} +{"current_steps": 32230, "total_steps": 33920, "loss": 0.3032, "lr": 7.551513967211433e-08, "epoch": 19.003537735849058, "percentage": 95.02, "elapsed_time": "1:02:33", "remaining_time": "0:03:16", "throughput": 5652.79, "total_tokens": 21218544} +{"current_steps": 32235, "total_steps": 33920, "loss": 0.2807, "lr": 7.507034818385883e-08, "epoch": 19.006485849056602, "percentage": 95.03, "elapsed_time": "1:02:34", "remaining_time": "0:03:16", "throughput": 5652.84, "total_tokens": 21222000} +{"current_steps": 32240, "total_steps": 33920, "loss": 0.3521, "lr": 7.462686059195423e-08, "epoch": 19.00943396226415, "percentage": 95.05, "elapsed_time": "1:02:34", "remaining_time": "0:03:15", "throughput": 5652.85, "total_tokens": 21225840} +{"current_steps": 32245, "total_steps": 33920, "loss": 0.2847, "lr": 7.418467701381548e-08, "epoch": 19.0123820754717, "percentage": 95.06, "elapsed_time": "1:02:35", "remaining_time": "0:03:15", "throughput": 5652.9, "total_tokens": 21229360} +{"current_steps": 32250, "total_steps": 33920, "loss": 0.3094, "lr": 7.374379756651285e-08, "epoch": 19.015330188679247, "percentage": 95.08, "elapsed_time": "1:02:36", "remaining_time": "0:03:14", "throughput": 5652.84, "total_tokens": 21232176} +{"current_steps": 32255, "total_steps": 33920, "loss": 0.2887, "lr": 7.330422236677015e-08, "epoch": 19.01827830188679, "percentage": 95.09, "elapsed_time": "1:02:36", "remaining_time": "0:03:13", "throughput": 5652.81, "total_tokens": 21235216} +{"current_steps": 32260, "total_steps": 33920, "loss": 0.3306, "lr": 7.286595153096765e-08, "epoch": 19.02122641509434, "percentage": 95.11, "elapsed_time": "1:02:37", "remaining_time": "0:03:13", "throughput": 5652.8, "total_tokens": 21238256} +{"current_steps": 32265, "total_steps": 33920, "loss": 0.2561, "lr": 7.242898517513864e-08, "epoch": 19.024174528301888, "percentage": 95.12, "elapsed_time": "1:02:37", "remaining_time": "0:03:12", "throughput": 5652.75, "total_tokens": 21241296} +{"current_steps": 32270, "total_steps": 33920, "loss": 0.364, "lr": 7.199332341497333e-08, "epoch": 19.027122641509433, "percentage": 95.14, "elapsed_time": "1:02:38", "remaining_time": "0:03:12", "throughput": 5652.54, "total_tokens": 21243600} +{"current_steps": 32275, "total_steps": 33920, "loss": 0.229, "lr": 7.155896636581394e-08, "epoch": 19.03007075471698, "percentage": 95.15, "elapsed_time": "1:02:38", "remaining_time": "0:03:11", "throughput": 5652.5, "total_tokens": 21246544} +{"current_steps": 32280, "total_steps": 33920, "loss": 0.2356, "lr": 7.112591414265901e-08, "epoch": 19.03301886792453, "percentage": 95.17, "elapsed_time": "1:02:39", "remaining_time": "0:03:11", "throughput": 5652.58, "total_tokens": 21250576} +{"current_steps": 32285, "total_steps": 33920, "loss": 0.2541, "lr": 7.069416686016018e-08, "epoch": 19.035966981132077, "percentage": 95.18, "elapsed_time": "1:02:40", "remaining_time": "0:03:10", "throughput": 5652.5, "total_tokens": 21253392} +{"current_steps": 32290, "total_steps": 33920, "loss": 0.2761, "lr": 7.026372463262488e-08, "epoch": 19.03891509433962, "percentage": 95.19, "elapsed_time": "1:02:40", "remaining_time": "0:03:09", "throughput": 5652.68, "total_tokens": 21258064} +{"current_steps": 32295, "total_steps": 33920, "loss": 0.3237, "lr": 6.983458757401418e-08, "epoch": 19.04186320754717, "percentage": 95.21, "elapsed_time": "1:02:41", "remaining_time": "0:03:09", "throughput": 5652.72, "total_tokens": 21261488} +{"current_steps": 32300, "total_steps": 33920, "loss": 0.3082, "lr": 6.940675579794443e-08, "epoch": 19.044811320754718, "percentage": 95.22, "elapsed_time": "1:02:41", "remaining_time": "0:03:08", "throughput": 5652.73, "total_tokens": 21264624} +{"current_steps": 32305, "total_steps": 33920, "loss": 0.2444, "lr": 6.898022941768612e-08, "epoch": 19.047759433962263, "percentage": 95.24, "elapsed_time": "1:02:42", "remaining_time": "0:03:08", "throughput": 5652.63, "total_tokens": 21267184} +{"current_steps": 32310, "total_steps": 33920, "loss": 0.3667, "lr": 6.855500854616337e-08, "epoch": 19.05070754716981, "percentage": 95.25, "elapsed_time": "1:02:42", "remaining_time": "0:03:07", "throughput": 5652.66, "total_tokens": 21270704} +{"current_steps": 32315, "total_steps": 33920, "loss": 0.3057, "lr": 6.813109329595557e-08, "epoch": 19.05365566037736, "percentage": 95.27, "elapsed_time": "1:02:43", "remaining_time": "0:03:06", "throughput": 5652.58, "total_tokens": 21273520} +{"current_steps": 32320, "total_steps": 33920, "loss": 0.3025, "lr": 6.770848377929573e-08, "epoch": 19.056603773584907, "percentage": 95.28, "elapsed_time": "1:02:44", "remaining_time": "0:03:06", "throughput": 5652.61, "total_tokens": 21277040} +{"current_steps": 32325, "total_steps": 33920, "loss": 0.2931, "lr": 6.728718010807156e-08, "epoch": 19.059551886792452, "percentage": 95.3, "elapsed_time": "1:02:44", "remaining_time": "0:03:05", "throughput": 5652.57, "total_tokens": 21279888} +{"current_steps": 32330, "total_steps": 33920, "loss": 0.382, "lr": 6.68671823938255e-08, "epoch": 19.0625, "percentage": 95.31, "elapsed_time": "1:02:45", "remaining_time": "0:03:05", "throughput": 5652.34, "total_tokens": 21282320} +{"current_steps": 32335, "total_steps": 33920, "loss": 0.2964, "lr": 6.644849074775361e-08, "epoch": 19.065448113207548, "percentage": 95.33, "elapsed_time": "1:02:45", "remaining_time": "0:03:04", "throughput": 5652.3, "total_tokens": 21285296} +{"current_steps": 32340, "total_steps": 33920, "loss": 0.424, "lr": 6.603110528070667e-08, "epoch": 19.068396226415093, "percentage": 95.34, "elapsed_time": "1:02:46", "remaining_time": "0:03:04", "throughput": 5652.37, "total_tokens": 21289008} +{"current_steps": 32345, "total_steps": 33920, "loss": 0.2611, "lr": 6.561502610318849e-08, "epoch": 19.07134433962264, "percentage": 95.36, "elapsed_time": "1:02:46", "remaining_time": "0:03:03", "throughput": 5652.27, "total_tokens": 21291952} +{"current_steps": 32350, "total_steps": 33920, "loss": 0.2914, "lr": 6.520025332535762e-08, "epoch": 19.07429245283019, "percentage": 95.37, "elapsed_time": "1:02:47", "remaining_time": "0:03:02", "throughput": 5652.39, "total_tokens": 21295632} +{"current_steps": 32355, "total_steps": 33920, "loss": 0.419, "lr": 6.47867870570279e-08, "epoch": 19.077240566037737, "percentage": 95.39, "elapsed_time": "1:02:48", "remaining_time": "0:03:02", "throughput": 5652.34, "total_tokens": 21298448} +{"current_steps": 32360, "total_steps": 33920, "loss": 0.3058, "lr": 6.437462740766564e-08, "epoch": 19.080188679245282, "percentage": 95.4, "elapsed_time": "1:02:48", "remaining_time": "0:03:01", "throughput": 5652.37, "total_tokens": 21301776} +{"current_steps": 32365, "total_steps": 33920, "loss": 0.3908, "lr": 6.396377448639246e-08, "epoch": 19.08313679245283, "percentage": 95.42, "elapsed_time": "1:02:49", "remaining_time": "0:03:01", "throughput": 5652.41, "total_tokens": 21305168} +{"current_steps": 32370, "total_steps": 33920, "loss": 0.2703, "lr": 6.3554228401983e-08, "epoch": 19.08608490566038, "percentage": 95.43, "elapsed_time": "1:02:49", "remaining_time": "0:03:00", "throughput": 5652.34, "total_tokens": 21307856} +{"current_steps": 32375, "total_steps": 33920, "loss": 0.2725, "lr": 6.314598926286663e-08, "epoch": 19.089033018867923, "percentage": 95.45, "elapsed_time": "1:02:50", "remaining_time": "0:02:59", "throughput": 5652.33, "total_tokens": 21311088} +{"current_steps": 32380, "total_steps": 33920, "loss": 0.3902, "lr": 6.273905717712637e-08, "epoch": 19.09198113207547, "percentage": 95.46, "elapsed_time": "1:02:50", "remaining_time": "0:02:59", "throughput": 5652.38, "total_tokens": 21314544} +{"current_steps": 32385, "total_steps": 33920, "loss": 0.2765, "lr": 6.233343225249933e-08, "epoch": 19.09492924528302, "percentage": 95.47, "elapsed_time": "1:02:51", "remaining_time": "0:02:58", "throughput": 5652.3, "total_tokens": 21317168} +{"current_steps": 32390, "total_steps": 33920, "loss": 0.348, "lr": 6.192911459637519e-08, "epoch": 19.097877358490567, "percentage": 95.49, "elapsed_time": "1:02:51", "remaining_time": "0:02:58", "throughput": 5652.31, "total_tokens": 21320208} +{"current_steps": 32395, "total_steps": 33920, "loss": 0.3421, "lr": 6.152610431580052e-08, "epoch": 19.100825471698112, "percentage": 95.5, "elapsed_time": "1:02:52", "remaining_time": "0:02:57", "throughput": 5652.3, "total_tokens": 21323152} +{"current_steps": 32400, "total_steps": 33920, "loss": 0.3556, "lr": 6.112440151747389e-08, "epoch": 19.10377358490566, "percentage": 95.52, "elapsed_time": "1:02:53", "remaining_time": "0:02:57", "throughput": 5652.27, "total_tokens": 21326160} +{"current_steps": 32405, "total_steps": 33920, "loss": 0.3095, "lr": 6.072400630774689e-08, "epoch": 19.10672169811321, "percentage": 95.53, "elapsed_time": "1:02:53", "remaining_time": "0:02:56", "throughput": 5652.29, "total_tokens": 21329264} +{"current_steps": 32410, "total_steps": 33920, "loss": 0.2777, "lr": 6.032491879262637e-08, "epoch": 19.109669811320753, "percentage": 95.55, "elapsed_time": "1:02:54", "remaining_time": "0:02:55", "throughput": 5652.2, "total_tokens": 21332016} +{"current_steps": 32415, "total_steps": 33920, "loss": 0.2691, "lr": 5.99271390777717e-08, "epoch": 19.1126179245283, "percentage": 95.56, "elapsed_time": "1:02:54", "remaining_time": "0:02:55", "throughput": 5652.15, "total_tokens": 21334992} +{"current_steps": 32420, "total_steps": 33920, "loss": 0.2207, "lr": 5.953066726849865e-08, "epoch": 19.11556603773585, "percentage": 95.58, "elapsed_time": "1:02:55", "remaining_time": "0:02:54", "throughput": 5652.17, "total_tokens": 21338032} +{"current_steps": 32425, "total_steps": 33920, "loss": 0.3282, "lr": 5.913550346977326e-08, "epoch": 19.118514150943398, "percentage": 95.59, "elapsed_time": "1:02:55", "remaining_time": "0:02:54", "throughput": 5652.23, "total_tokens": 21342032} +{"current_steps": 32430, "total_steps": 33920, "loss": 0.2933, "lr": 5.874164778621683e-08, "epoch": 19.121462264150942, "percentage": 95.61, "elapsed_time": "1:02:56", "remaining_time": "0:02:53", "throughput": 5652.43, "total_tokens": 21346736} +{"current_steps": 32435, "total_steps": 33920, "loss": 0.2501, "lr": 5.834910032210539e-08, "epoch": 19.12441037735849, "percentage": 95.62, "elapsed_time": "1:02:57", "remaining_time": "0:02:52", "throughput": 5652.36, "total_tokens": 21349488} +{"current_steps": 32440, "total_steps": 33920, "loss": 0.4349, "lr": 5.795786118136693e-08, "epoch": 19.12735849056604, "percentage": 95.64, "elapsed_time": "1:02:57", "remaining_time": "0:02:52", "throughput": 5652.38, "total_tokens": 21352784} +{"current_steps": 32445, "total_steps": 33920, "loss": 0.3724, "lr": 5.756793046758302e-08, "epoch": 19.130306603773583, "percentage": 95.65, "elapsed_time": "1:02:58", "remaining_time": "0:02:51", "throughput": 5652.22, "total_tokens": 21355248} +{"current_steps": 32450, "total_steps": 33920, "loss": 0.276, "lr": 5.7179308283990544e-08, "epoch": 19.13325471698113, "percentage": 95.67, "elapsed_time": "1:02:58", "remaining_time": "0:02:51", "throughput": 5652.29, "total_tokens": 21358832} +{"current_steps": 32455, "total_steps": 33920, "loss": 0.427, "lr": 5.679199473347885e-08, "epoch": 19.13620283018868, "percentage": 95.68, "elapsed_time": "1:02:59", "remaining_time": "0:02:50", "throughput": 5652.22, "total_tokens": 21361552} +{"current_steps": 32460, "total_steps": 33920, "loss": 0.2596, "lr": 5.6405989918590366e-08, "epoch": 19.139150943396228, "percentage": 95.7, "elapsed_time": "1:03:00", "remaining_time": "0:02:50", "throughput": 5652.28, "total_tokens": 21365648} +{"current_steps": 32465, "total_steps": 33920, "loss": 0.2447, "lr": 5.6021293941522225e-08, "epoch": 19.142099056603772, "percentage": 95.71, "elapsed_time": "1:03:00", "remaining_time": "0:02:49", "throughput": 5652.32, "total_tokens": 21369136} +{"current_steps": 32470, "total_steps": 33920, "loss": 0.2511, "lr": 5.563790690412352e-08, "epoch": 19.14504716981132, "percentage": 95.73, "elapsed_time": "1:03:01", "remaining_time": "0:02:48", "throughput": 5652.35, "total_tokens": 21372304} +{"current_steps": 32475, "total_steps": 33920, "loss": 0.4385, "lr": 5.525582890789805e-08, "epoch": 19.14799528301887, "percentage": 95.74, "elapsed_time": "1:03:01", "remaining_time": "0:02:48", "throughput": 5652.28, "total_tokens": 21375184} +{"current_steps": 32480, "total_steps": 33920, "loss": 0.3633, "lr": 5.4875060054002115e-08, "epoch": 19.150943396226417, "percentage": 95.75, "elapsed_time": "1:03:02", "remaining_time": "0:02:47", "throughput": 5652.36, "total_tokens": 21378960} +{"current_steps": 32485, "total_steps": 33920, "loss": 0.3565, "lr": 5.4495600443246755e-08, "epoch": 19.15389150943396, "percentage": 95.77, "elapsed_time": "1:03:02", "remaining_time": "0:02:47", "throughput": 5652.3, "total_tokens": 21381808} +{"current_steps": 32490, "total_steps": 33920, "loss": 0.2618, "lr": 5.411745017609493e-08, "epoch": 19.15683962264151, "percentage": 95.78, "elapsed_time": "1:03:03", "remaining_time": "0:02:46", "throughput": 5652.17, "total_tokens": 21384592} +{"current_steps": 32495, "total_steps": 33920, "loss": 0.2724, "lr": 5.374060935266434e-08, "epoch": 19.159787735849058, "percentage": 95.8, "elapsed_time": "1:03:04", "remaining_time": "0:02:45", "throughput": 5652.23, "total_tokens": 21388304} +{"current_steps": 32500, "total_steps": 33920, "loss": 0.313, "lr": 5.3365078072724065e-08, "epoch": 19.162735849056602, "percentage": 95.81, "elapsed_time": "1:03:04", "remaining_time": "0:02:45", "throughput": 5652.32, "total_tokens": 21391824} +{"current_steps": 32505, "total_steps": 33920, "loss": 0.2316, "lr": 5.299085643569846e-08, "epoch": 19.16568396226415, "percentage": 95.83, "elapsed_time": "1:03:05", "remaining_time": "0:02:44", "throughput": 5652.38, "total_tokens": 21395056} +{"current_steps": 32510, "total_steps": 33920, "loss": 0.2785, "lr": 5.261794454066327e-08, "epoch": 19.1686320754717, "percentage": 95.84, "elapsed_time": "1:03:05", "remaining_time": "0:02:44", "throughput": 5652.45, "total_tokens": 21398608} +{"current_steps": 32515, "total_steps": 33920, "loss": 0.2068, "lr": 5.224634248635008e-08, "epoch": 19.171580188679247, "percentage": 95.86, "elapsed_time": "1:03:06", "remaining_time": "0:02:43", "throughput": 5652.54, "total_tokens": 21402704} +{"current_steps": 32520, "total_steps": 33920, "loss": 0.3764, "lr": 5.187605037114129e-08, "epoch": 19.17452830188679, "percentage": 95.87, "elapsed_time": "1:03:06", "remaining_time": "0:02:43", "throughput": 5652.64, "total_tokens": 21406352} +{"current_steps": 32525, "total_steps": 33920, "loss": 0.2558, "lr": 5.15070682930735e-08, "epoch": 19.17747641509434, "percentage": 95.89, "elapsed_time": "1:03:07", "remaining_time": "0:02:42", "throughput": 5652.66, "total_tokens": 21409584} +{"current_steps": 32530, "total_steps": 33920, "loss": 0.3528, "lr": 5.113939634983578e-08, "epoch": 19.180424528301888, "percentage": 95.9, "elapsed_time": "1:03:08", "remaining_time": "0:02:41", "throughput": 5652.59, "total_tokens": 21413168} +{"current_steps": 32535, "total_steps": 33920, "loss": 0.2476, "lr": 5.077303463877192e-08, "epoch": 19.183372641509433, "percentage": 95.92, "elapsed_time": "1:03:08", "remaining_time": "0:02:41", "throughput": 5652.63, "total_tokens": 21416848} +{"current_steps": 32540, "total_steps": 33920, "loss": 0.374, "lr": 5.040798325687601e-08, "epoch": 19.18632075471698, "percentage": 95.93, "elapsed_time": "1:03:09", "remaining_time": "0:02:40", "throughput": 5652.69, "total_tokens": 21420016} +{"current_steps": 32545, "total_steps": 33920, "loss": 0.2976, "lr": 5.004424230079852e-08, "epoch": 19.18926886792453, "percentage": 95.95, "elapsed_time": "1:03:10", "remaining_time": "0:02:40", "throughput": 5652.85, "total_tokens": 21424656} +{"current_steps": 32550, "total_steps": 33920, "loss": 0.3522, "lr": 4.968181186684129e-08, "epoch": 19.192216981132077, "percentage": 95.96, "elapsed_time": "1:03:10", "remaining_time": "0:02:39", "throughput": 5652.82, "total_tokens": 21427664} +{"current_steps": 32555, "total_steps": 33920, "loss": 0.3396, "lr": 4.932069205095924e-08, "epoch": 19.19516509433962, "percentage": 95.98, "elapsed_time": "1:03:11", "remaining_time": "0:02:38", "throughput": 5652.77, "total_tokens": 21430448} +{"current_steps": 32560, "total_steps": 33920, "loss": 0.3152, "lr": 4.896088294875978e-08, "epoch": 19.19811320754717, "percentage": 95.99, "elapsed_time": "1:03:11", "remaining_time": "0:02:38", "throughput": 5652.77, "total_tokens": 21433616} +{"current_steps": 32565, "total_steps": 33920, "loss": 0.3001, "lr": 4.8602384655505044e-08, "epoch": 19.201061320754718, "percentage": 96.01, "elapsed_time": "1:03:12", "remaining_time": "0:02:37", "throughput": 5652.73, "total_tokens": 21436496} +{"current_steps": 32570, "total_steps": 33920, "loss": 0.2978, "lr": 4.824519726610744e-08, "epoch": 19.204009433962263, "percentage": 96.02, "elapsed_time": "1:03:12", "remaining_time": "0:02:37", "throughput": 5652.75, "total_tokens": 21439792} +{"current_steps": 32575, "total_steps": 33920, "loss": 0.3449, "lr": 4.7889320875135206e-08, "epoch": 19.20695754716981, "percentage": 96.03, "elapsed_time": "1:03:13", "remaining_time": "0:02:36", "throughput": 5652.73, "total_tokens": 21443024} +{"current_steps": 32580, "total_steps": 33920, "loss": 0.2996, "lr": 4.753475557680742e-08, "epoch": 19.20990566037736, "percentage": 96.05, "elapsed_time": "1:03:13", "remaining_time": "0:02:36", "throughput": 5652.73, "total_tokens": 21446096} +{"current_steps": 32585, "total_steps": 33920, "loss": 0.35, "lr": 4.718150146499734e-08, "epoch": 19.212853773584907, "percentage": 96.06, "elapsed_time": "1:03:14", "remaining_time": "0:02:35", "throughput": 5652.91, "total_tokens": 21450480} +{"current_steps": 32590, "total_steps": 33920, "loss": 0.2721, "lr": 4.682955863323013e-08, "epoch": 19.215801886792452, "percentage": 96.08, "elapsed_time": "1:03:15", "remaining_time": "0:02:34", "throughput": 5652.86, "total_tokens": 21453360} +{"current_steps": 32595, "total_steps": 33920, "loss": 0.3261, "lr": 4.6478927174684606e-08, "epoch": 19.21875, "percentage": 96.09, "elapsed_time": "1:03:15", "remaining_time": "0:02:34", "throughput": 5652.81, "total_tokens": 21456112} +{"current_steps": 32600, "total_steps": 33920, "loss": 0.3093, "lr": 4.612960718219095e-08, "epoch": 19.221698113207548, "percentage": 96.11, "elapsed_time": "1:03:16", "remaining_time": "0:02:33", "throughput": 5652.77, "total_tokens": 21458864} +{"current_steps": 32605, "total_steps": 33920, "loss": 0.2758, "lr": 4.578159874823407e-08, "epoch": 19.224646226415093, "percentage": 96.12, "elapsed_time": "1:03:16", "remaining_time": "0:02:33", "throughput": 5652.78, "total_tokens": 21462192} +{"current_steps": 32610, "total_steps": 33920, "loss": 0.2303, "lr": 4.5434901964950264e-08, "epoch": 19.22759433962264, "percentage": 96.14, "elapsed_time": "1:03:17", "remaining_time": "0:02:32", "throughput": 5652.82, "total_tokens": 21465328} +{"current_steps": 32615, "total_steps": 33920, "loss": 0.3314, "lr": 4.508951692412944e-08, "epoch": 19.23054245283019, "percentage": 96.15, "elapsed_time": "1:03:17", "remaining_time": "0:02:31", "throughput": 5652.82, "total_tokens": 21468752} +{"current_steps": 32620, "total_steps": 33920, "loss": 0.1805, "lr": 4.4745443717213455e-08, "epoch": 19.233490566037737, "percentage": 96.17, "elapsed_time": "1:03:18", "remaining_time": "0:02:31", "throughput": 5652.71, "total_tokens": 21471696} +{"current_steps": 32625, "total_steps": 33920, "loss": 0.3073, "lr": 4.4402682435296666e-08, "epoch": 19.236438679245282, "percentage": 96.18, "elapsed_time": "1:03:19", "remaining_time": "0:02:30", "throughput": 5652.73, "total_tokens": 21474928} +{"current_steps": 32630, "total_steps": 33920, "loss": 0.328, "lr": 4.406123316912758e-08, "epoch": 19.23938679245283, "percentage": 96.2, "elapsed_time": "1:03:19", "remaining_time": "0:02:30", "throughput": 5652.84, "total_tokens": 21478448} +{"current_steps": 32635, "total_steps": 33920, "loss": 0.3637, "lr": 4.372109600910612e-08, "epoch": 19.24233490566038, "percentage": 96.21, "elapsed_time": "1:03:20", "remaining_time": "0:02:29", "throughput": 5652.81, "total_tokens": 21481456} +{"current_steps": 32640, "total_steps": 33920, "loss": 0.3251, "lr": 4.338227104528414e-08, "epoch": 19.245283018867923, "percentage": 96.23, "elapsed_time": "1:03:20", "remaining_time": "0:02:29", "throughput": 5652.97, "total_tokens": 21486000} +{"current_steps": 32645, "total_steps": 33920, "loss": 0.2865, "lr": 4.304475836736821e-08, "epoch": 19.24823113207547, "percentage": 96.24, "elapsed_time": "1:03:21", "remaining_time": "0:02:28", "throughput": 5653.08, "total_tokens": 21489520} +{"current_steps": 32650, "total_steps": 33920, "loss": 0.3941, "lr": 4.27085580647163e-08, "epoch": 19.25117924528302, "percentage": 96.26, "elapsed_time": "1:03:22", "remaining_time": "0:02:27", "throughput": 5653.1, "total_tokens": 21493104} +{"current_steps": 32655, "total_steps": 33920, "loss": 0.3132, "lr": 4.237367022633776e-08, "epoch": 19.254127358490567, "percentage": 96.27, "elapsed_time": "1:03:22", "remaining_time": "0:02:27", "throughput": 5653.09, "total_tokens": 21496016} +{"current_steps": 32660, "total_steps": 33920, "loss": 0.2877, "lr": 4.204009494089612e-08, "epoch": 19.257075471698112, "percentage": 96.29, "elapsed_time": "1:03:23", "remaining_time": "0:02:26", "throughput": 5653.12, "total_tokens": 21499632} +{"current_steps": 32665, "total_steps": 33920, "loss": 0.2605, "lr": 4.170783229670739e-08, "epoch": 19.26002358490566, "percentage": 96.3, "elapsed_time": "1:03:23", "remaining_time": "0:02:26", "throughput": 5653.16, "total_tokens": 21502736} +{"current_steps": 32670, "total_steps": 33920, "loss": 0.3163, "lr": 4.137688238173898e-08, "epoch": 19.26297169811321, "percentage": 96.31, "elapsed_time": "1:03:24", "remaining_time": "0:02:25", "throughput": 5653.15, "total_tokens": 21506000} +{"current_steps": 32675, "total_steps": 33920, "loss": 0.2895, "lr": 4.104724528361137e-08, "epoch": 19.265919811320753, "percentage": 96.33, "elapsed_time": "1:03:24", "remaining_time": "0:02:24", "throughput": 5653.17, "total_tokens": 21509360} +{"current_steps": 32680, "total_steps": 33920, "loss": 0.274, "lr": 4.071892108959752e-08, "epoch": 19.2688679245283, "percentage": 96.34, "elapsed_time": "1:03:25", "remaining_time": "0:02:24", "throughput": 5653.3, "total_tokens": 21513232} +{"current_steps": 32685, "total_steps": 33920, "loss": 0.4243, "lr": 4.039190988662234e-08, "epoch": 19.27181603773585, "percentage": 96.36, "elapsed_time": "1:03:26", "remaining_time": "0:02:23", "throughput": 5653.29, "total_tokens": 21516592} +{"current_steps": 32690, "total_steps": 33920, "loss": 0.4868, "lr": 4.006621176126435e-08, "epoch": 19.274764150943398, "percentage": 96.37, "elapsed_time": "1:03:26", "remaining_time": "0:02:23", "throughput": 5653.53, "total_tokens": 21522864} +{"current_steps": 32695, "total_steps": 33920, "loss": 0.3448, "lr": 3.974182679975236e-08, "epoch": 19.277712264150942, "percentage": 96.39, "elapsed_time": "1:03:27", "remaining_time": "0:02:22", "throughput": 5653.67, "total_tokens": 21526544} +{"current_steps": 32700, "total_steps": 33920, "loss": 0.3236, "lr": 3.941875508796933e-08, "epoch": 19.28066037735849, "percentage": 96.4, "elapsed_time": "1:03:28", "remaining_time": "0:02:22", "throughput": 5653.68, "total_tokens": 21529936} +{"current_steps": 32705, "total_steps": 33920, "loss": 0.3061, "lr": 3.909699671145017e-08, "epoch": 19.28360849056604, "percentage": 96.42, "elapsed_time": "1:03:28", "remaining_time": "0:02:21", "throughput": 5653.66, "total_tokens": 21533168} +{"current_steps": 32710, "total_steps": 33920, "loss": 0.2455, "lr": 3.87765517553812e-08, "epoch": 19.286556603773583, "percentage": 96.43, "elapsed_time": "1:03:29", "remaining_time": "0:02:20", "throughput": 5653.61, "total_tokens": 21535984} +{"current_steps": 32715, "total_steps": 33920, "loss": 0.3099, "lr": 3.8457420304601756e-08, "epoch": 19.28950471698113, "percentage": 96.45, "elapsed_time": "1:03:29", "remaining_time": "0:02:20", "throughput": 5653.61, "total_tokens": 21538928} +{"current_steps": 32720, "total_steps": 33920, "loss": 0.3078, "lr": 3.813960244360371e-08, "epoch": 19.29245283018868, "percentage": 96.46, "elapsed_time": "1:03:30", "remaining_time": "0:02:19", "throughput": 5653.73, "total_tokens": 21543152} +{"current_steps": 32725, "total_steps": 33920, "loss": 0.3203, "lr": 3.7823098256529744e-08, "epoch": 19.295400943396228, "percentage": 96.48, "elapsed_time": "1:03:30", "remaining_time": "0:02:19", "throughput": 5653.79, "total_tokens": 21546448} +{"current_steps": 32730, "total_steps": 33920, "loss": 0.3431, "lr": 3.750790782717673e-08, "epoch": 19.298349056603772, "percentage": 96.49, "elapsed_time": "1:03:31", "remaining_time": "0:02:18", "throughput": 5653.79, "total_tokens": 21549520} +{"current_steps": 32735, "total_steps": 33920, "loss": 0.3832, "lr": 3.719403123899179e-08, "epoch": 19.30129716981132, "percentage": 96.51, "elapsed_time": "1:03:32", "remaining_time": "0:02:17", "throughput": 5653.63, "total_tokens": 21551888} +{"current_steps": 32740, "total_steps": 33920, "loss": 0.3341, "lr": 3.688146857507624e-08, "epoch": 19.30424528301887, "percentage": 96.52, "elapsed_time": "1:03:32", "remaining_time": "0:02:17", "throughput": 5653.6, "total_tokens": 21554896} +{"current_steps": 32745, "total_steps": 33920, "loss": 0.4191, "lr": 3.657021991818166e-08, "epoch": 19.307193396226417, "percentage": 96.54, "elapsed_time": "1:03:33", "remaining_time": "0:02:16", "throughput": 5653.69, "total_tokens": 21558960} +{"current_steps": 32750, "total_steps": 33920, "loss": 0.2568, "lr": 3.626028535071213e-08, "epoch": 19.31014150943396, "percentage": 96.55, "elapsed_time": "1:03:33", "remaining_time": "0:02:16", "throughput": 5653.62, "total_tokens": 21562064} +{"current_steps": 32755, "total_steps": 33920, "loss": 0.3213, "lr": 3.59516649547248e-08, "epoch": 19.31308962264151, "percentage": 96.57, "elapsed_time": "1:03:34", "remaining_time": "0:02:15", "throughput": 5653.53, "total_tokens": 21564624} +{"current_steps": 32760, "total_steps": 33920, "loss": 0.2942, "lr": 3.564435881192818e-08, "epoch": 19.316037735849058, "percentage": 96.58, "elapsed_time": "1:03:34", "remaining_time": "0:02:15", "throughput": 5653.42, "total_tokens": 21567312} +{"current_steps": 32765, "total_steps": 33920, "loss": 0.284, "lr": 3.5338367003682763e-08, "epoch": 19.318985849056602, "percentage": 96.59, "elapsed_time": "1:03:35", "remaining_time": "0:02:14", "throughput": 5653.34, "total_tokens": 21569904} +{"current_steps": 32770, "total_steps": 33920, "loss": 0.2839, "lr": 3.5033689611000954e-08, "epoch": 19.32193396226415, "percentage": 96.61, "elapsed_time": "1:03:35", "remaining_time": "0:02:13", "throughput": 5653.32, "total_tokens": 21573008} +{"current_steps": 32775, "total_steps": 33920, "loss": 0.5003, "lr": 3.473032671454768e-08, "epoch": 19.3248820754717, "percentage": 96.62, "elapsed_time": "1:03:36", "remaining_time": "0:02:13", "throughput": 5653.34, "total_tokens": 21576240} +{"current_steps": 32780, "total_steps": 33920, "loss": 0.2326, "lr": 3.44282783946398e-08, "epoch": 19.327830188679247, "percentage": 96.64, "elapsed_time": "1:03:37", "remaining_time": "0:02:12", "throughput": 5653.27, "total_tokens": 21578960} +{"current_steps": 32785, "total_steps": 33920, "loss": 0.2679, "lr": 3.4127544731245575e-08, "epoch": 19.33077830188679, "percentage": 96.65, "elapsed_time": "1:03:37", "remaining_time": "0:02:12", "throughput": 5653.25, "total_tokens": 21582128} +{"current_steps": 32790, "total_steps": 33920, "loss": 0.2334, "lr": 3.38281258039852e-08, "epoch": 19.33372641509434, "percentage": 96.67, "elapsed_time": "1:03:38", "remaining_time": "0:02:11", "throughput": 5653.28, "total_tokens": 21585264} +{"current_steps": 32795, "total_steps": 33920, "loss": 0.3433, "lr": 3.353002169213193e-08, "epoch": 19.336674528301888, "percentage": 96.68, "elapsed_time": "1:03:38", "remaining_time": "0:02:10", "throughput": 5653.34, "total_tokens": 21588688} +{"current_steps": 32800, "total_steps": 33920, "loss": 0.3634, "lr": 3.32332324746093e-08, "epoch": 19.339622641509433, "percentage": 96.7, "elapsed_time": "1:03:39", "remaining_time": "0:02:10", "throughput": 5653.45, "total_tokens": 21592720} +{"current_steps": 32805, "total_steps": 33920, "loss": 0.3475, "lr": 3.2937758229994455e-08, "epoch": 19.34257075471698, "percentage": 96.71, "elapsed_time": "1:03:39", "remaining_time": "0:02:09", "throughput": 5653.38, "total_tokens": 21595568} +{"current_steps": 32810, "total_steps": 33920, "loss": 0.3581, "lr": 3.2643599036514815e-08, "epoch": 19.34551886792453, "percentage": 96.73, "elapsed_time": "1:03:40", "remaining_time": "0:02:09", "throughput": 5653.43, "total_tokens": 21599120} +{"current_steps": 32815, "total_steps": 33920, "loss": 0.3286, "lr": 3.2350754972050316e-08, "epoch": 19.348466981132077, "percentage": 96.74, "elapsed_time": "1:03:41", "remaining_time": "0:02:08", "throughput": 5653.62, "total_tokens": 21603600} +{"current_steps": 32820, "total_steps": 33920, "loss": 0.3051, "lr": 3.2059226114132815e-08, "epoch": 19.35141509433962, "percentage": 96.76, "elapsed_time": "1:03:41", "remaining_time": "0:02:08", "throughput": 5653.71, "total_tokens": 21607152} +{"current_steps": 32825, "total_steps": 33920, "loss": 0.3464, "lr": 3.1769012539945575e-08, "epoch": 19.35436320754717, "percentage": 96.77, "elapsed_time": "1:03:42", "remaining_time": "0:02:07", "throughput": 5653.66, "total_tokens": 21609936} +{"current_steps": 32830, "total_steps": 33920, "loss": 0.3146, "lr": 3.1480114326324364e-08, "epoch": 19.357311320754718, "percentage": 96.79, "elapsed_time": "1:03:43", "remaining_time": "0:02:06", "throughput": 5653.77, "total_tokens": 21614384} +{"current_steps": 32835, "total_steps": 33920, "loss": 0.3227, "lr": 3.1192531549756325e-08, "epoch": 19.360259433962263, "percentage": 96.8, "elapsed_time": "1:03:43", "remaining_time": "0:02:06", "throughput": 5653.81, "total_tokens": 21617872} +{"current_steps": 32840, "total_steps": 33920, "loss": 0.3422, "lr": 3.090626428638e-08, "epoch": 19.36320754716981, "percentage": 96.82, "elapsed_time": "1:03:44", "remaining_time": "0:02:05", "throughput": 5653.85, "total_tokens": 21621328} +{"current_steps": 32845, "total_steps": 33920, "loss": 0.3451, "lr": 3.062131261198531e-08, "epoch": 19.36615566037736, "percentage": 96.83, "elapsed_time": "1:03:44", "remaining_time": "0:02:05", "throughput": 5653.86, "total_tokens": 21624432} +{"current_steps": 32850, "total_steps": 33920, "loss": 0.2737, "lr": 3.033767660201525e-08, "epoch": 19.369103773584907, "percentage": 96.85, "elapsed_time": "1:03:45", "remaining_time": "0:02:04", "throughput": 5653.8, "total_tokens": 21627248} +{"current_steps": 32855, "total_steps": 33920, "loss": 0.2994, "lr": 3.005535633156309e-08, "epoch": 19.372051886792452, "percentage": 96.86, "elapsed_time": "1:03:45", "remaining_time": "0:02:04", "throughput": 5653.76, "total_tokens": 21630064} +{"current_steps": 32860, "total_steps": 33920, "loss": 0.2403, "lr": 2.977435187537514e-08, "epoch": 19.375, "percentage": 96.88, "elapsed_time": "1:03:46", "remaining_time": "0:02:03", "throughput": 5653.78, "total_tokens": 21633264} +{"current_steps": 32865, "total_steps": 33920, "loss": 0.2793, "lr": 2.949466330784745e-08, "epoch": 19.377948113207548, "percentage": 96.89, "elapsed_time": "1:03:46", "remaining_time": "0:02:02", "throughput": 5653.84, "total_tokens": 21636656} +{"current_steps": 32870, "total_steps": 33920, "loss": 0.2044, "lr": 2.921629070302967e-08, "epoch": 19.380896226415093, "percentage": 96.9, "elapsed_time": "1:03:47", "remaining_time": "0:02:02", "throughput": 5654.01, "total_tokens": 21640752} +{"current_steps": 32875, "total_steps": 33920, "loss": 0.2555, "lr": 2.893923413462174e-08, "epoch": 19.38384433962264, "percentage": 96.92, "elapsed_time": "1:03:48", "remaining_time": "0:02:01", "throughput": 5654.05, "total_tokens": 21644144} +{"current_steps": 32880, "total_steps": 33920, "loss": 0.3363, "lr": 2.866349367597554e-08, "epoch": 19.38679245283019, "percentage": 96.93, "elapsed_time": "1:03:48", "remaining_time": "0:02:01", "throughput": 5654.01, "total_tokens": 21646928} +{"current_steps": 32885, "total_steps": 33920, "loss": 0.3627, "lr": 2.8389069400094893e-08, "epoch": 19.389740566037737, "percentage": 96.95, "elapsed_time": "1:03:49", "remaining_time": "0:02:00", "throughput": 5653.85, "total_tokens": 21649296} +{"current_steps": 32890, "total_steps": 33920, "loss": 0.1841, "lr": 2.811596137963446e-08, "epoch": 19.392688679245282, "percentage": 96.96, "elapsed_time": "1:03:49", "remaining_time": "0:01:59", "throughput": 5653.77, "total_tokens": 21651984} +{"current_steps": 32895, "total_steps": 33920, "loss": 0.4163, "lr": 2.7844169686900844e-08, "epoch": 19.39563679245283, "percentage": 96.98, "elapsed_time": "1:03:50", "remaining_time": "0:01:59", "throughput": 5653.77, "total_tokens": 21655120} +{"current_steps": 32900, "total_steps": 33920, "loss": 0.2757, "lr": 2.7573694393852047e-08, "epoch": 19.39858490566038, "percentage": 96.99, "elapsed_time": "1:03:50", "remaining_time": "0:01:58", "throughput": 5653.7, "total_tokens": 21658224} +{"current_steps": 32905, "total_steps": 33920, "loss": 0.2021, "lr": 2.7304535572098e-08, "epoch": 19.401533018867923, "percentage": 97.01, "elapsed_time": "1:03:51", "remaining_time": "0:01:58", "throughput": 5653.73, "total_tokens": 21661456} +{"current_steps": 32910, "total_steps": 33920, "loss": 0.3331, "lr": 2.703669329289893e-08, "epoch": 19.40448113207547, "percentage": 97.02, "elapsed_time": "1:03:51", "remaining_time": "0:01:57", "throughput": 5653.69, "total_tokens": 21664272} +{"current_steps": 32915, "total_steps": 33920, "loss": 0.2606, "lr": 2.6770167627167554e-08, "epoch": 19.40742924528302, "percentage": 97.04, "elapsed_time": "1:03:52", "remaining_time": "0:01:57", "throughput": 5653.65, "total_tokens": 21667088} +{"current_steps": 32920, "total_steps": 33920, "loss": 0.4221, "lr": 2.6504958645467426e-08, "epoch": 19.410377358490567, "percentage": 97.05, "elapsed_time": "1:03:52", "remaining_time": "0:01:56", "throughput": 5653.54, "total_tokens": 21669744} +{"current_steps": 32925, "total_steps": 33920, "loss": 0.3385, "lr": 2.6241066418014605e-08, "epoch": 19.413325471698112, "percentage": 97.07, "elapsed_time": "1:03:53", "remaining_time": "0:01:55", "throughput": 5653.55, "total_tokens": 21673008} +{"current_steps": 32930, "total_steps": 33920, "loss": 0.2689, "lr": 2.5978491014674866e-08, "epoch": 19.41627358490566, "percentage": 97.08, "elapsed_time": "1:03:54", "remaining_time": "0:01:55", "throughput": 5653.52, "total_tokens": 21676080} +{"current_steps": 32935, "total_steps": 33920, "loss": 0.2322, "lr": 2.571723250496705e-08, "epoch": 19.41922169811321, "percentage": 97.1, "elapsed_time": "1:03:54", "remaining_time": "0:01:54", "throughput": 5653.49, "total_tokens": 21679216} +{"current_steps": 32940, "total_steps": 33920, "loss": 0.2334, "lr": 2.5457290958059155e-08, "epoch": 19.422169811320753, "percentage": 97.11, "elapsed_time": "1:03:55", "remaining_time": "0:01:54", "throughput": 5653.45, "total_tokens": 21682064} +{"current_steps": 32945, "total_steps": 33920, "loss": 0.3414, "lr": 2.51986664427728e-08, "epoch": 19.4251179245283, "percentage": 97.13, "elapsed_time": "1:03:55", "remaining_time": "0:01:53", "throughput": 5653.41, "total_tokens": 21684912} +{"current_steps": 32950, "total_steps": 33920, "loss": 0.2539, "lr": 2.4941359027579883e-08, "epoch": 19.42806603773585, "percentage": 97.14, "elapsed_time": "1:03:56", "remaining_time": "0:01:52", "throughput": 5653.43, "total_tokens": 21687920} +{"current_steps": 32955, "total_steps": 33920, "loss": 0.2879, "lr": 2.468536878060368e-08, "epoch": 19.431014150943398, "percentage": 97.16, "elapsed_time": "1:03:56", "remaining_time": "0:01:52", "throughput": 5653.41, "total_tokens": 21690864} +{"current_steps": 32960, "total_steps": 33920, "loss": 0.2686, "lr": 2.443069576961832e-08, "epoch": 19.433962264150942, "percentage": 97.17, "elapsed_time": "1:03:57", "remaining_time": "0:01:51", "throughput": 5653.36, "total_tokens": 21693648} +{"current_steps": 32965, "total_steps": 33920, "loss": 0.3295, "lr": 2.4177340062049304e-08, "epoch": 19.43691037735849, "percentage": 97.18, "elapsed_time": "1:03:57", "remaining_time": "0:01:51", "throughput": 5653.38, "total_tokens": 21696976} +{"current_steps": 32970, "total_steps": 33920, "loss": 0.2582, "lr": 2.3925301724974647e-08, "epoch": 19.43985849056604, "percentage": 97.2, "elapsed_time": "1:03:58", "remaining_time": "0:01:50", "throughput": 5653.46, "total_tokens": 21700912} +{"current_steps": 32975, "total_steps": 33920, "loss": 0.1738, "lr": 2.367458082512153e-08, "epoch": 19.442806603773583, "percentage": 97.21, "elapsed_time": "1:03:59", "remaining_time": "0:01:50", "throughput": 5653.45, "total_tokens": 21704112} +{"current_steps": 32980, "total_steps": 33920, "loss": 0.2444, "lr": 2.3425177428870737e-08, "epoch": 19.44575471698113, "percentage": 97.23, "elapsed_time": "1:03:59", "remaining_time": "0:01:49", "throughput": 5653.59, "total_tokens": 21708176} +{"current_steps": 32985, "total_steps": 33920, "loss": 0.2761, "lr": 2.3177091602251677e-08, "epoch": 19.44870283018868, "percentage": 97.24, "elapsed_time": "1:04:00", "remaining_time": "0:01:48", "throughput": 5653.64, "total_tokens": 21711344} +{"current_steps": 32990, "total_steps": 33920, "loss": 0.3634, "lr": 2.2930323410946254e-08, "epoch": 19.451650943396228, "percentage": 97.26, "elapsed_time": "1:04:00", "remaining_time": "0:01:48", "throughput": 5653.58, "total_tokens": 21714096} +{"current_steps": 32995, "total_steps": 33920, "loss": 0.2577, "lr": 2.2684872920287758e-08, "epoch": 19.454599056603772, "percentage": 97.27, "elapsed_time": "1:04:01", "remaining_time": "0:01:47", "throughput": 5653.66, "total_tokens": 21717744} +{"current_steps": 33000, "total_steps": 33920, "loss": 0.4002, "lr": 2.2440740195260323e-08, "epoch": 19.45754716981132, "percentage": 97.29, "elapsed_time": "1:04:01", "remaining_time": "0:01:47", "throughput": 5653.64, "total_tokens": 21720752} +{"current_steps": 33005, "total_steps": 33920, "loss": 0.3104, "lr": 2.219792530049891e-08, "epoch": 19.46049528301887, "percentage": 97.3, "elapsed_time": "1:04:02", "remaining_time": "0:01:46", "throughput": 5653.74, "total_tokens": 21724784} +{"current_steps": 33010, "total_steps": 33920, "loss": 0.2844, "lr": 2.1956428300290434e-08, "epoch": 19.463443396226417, "percentage": 97.32, "elapsed_time": "1:04:03", "remaining_time": "0:01:45", "throughput": 5653.71, "total_tokens": 21727728} +{"current_steps": 33015, "total_steps": 33920, "loss": 0.3298, "lr": 2.1716249258570966e-08, "epoch": 19.46639150943396, "percentage": 97.33, "elapsed_time": "1:04:03", "remaining_time": "0:01:45", "throughput": 5653.7, "total_tokens": 21730960} +{"current_steps": 33020, "total_steps": 33920, "loss": 0.2423, "lr": 2.1477388238930196e-08, "epoch": 19.46933962264151, "percentage": 97.35, "elapsed_time": "1:04:04", "remaining_time": "0:01:44", "throughput": 5653.77, "total_tokens": 21734480} +{"current_steps": 33025, "total_steps": 33920, "loss": 0.2789, "lr": 2.1239845304606988e-08, "epoch": 19.472287735849058, "percentage": 97.36, "elapsed_time": "1:04:04", "remaining_time": "0:01:44", "throughput": 5653.7, "total_tokens": 21737392} +{"current_steps": 33030, "total_steps": 33920, "loss": 0.3375, "lr": 2.100362051849214e-08, "epoch": 19.475235849056602, "percentage": 97.38, "elapsed_time": "1:04:05", "remaining_time": "0:01:43", "throughput": 5653.79, "total_tokens": 21741424} +{"current_steps": 33035, "total_steps": 33920, "loss": 0.3623, "lr": 2.076871394312674e-08, "epoch": 19.47818396226415, "percentage": 97.39, "elapsed_time": "1:04:05", "remaining_time": "0:01:43", "throughput": 5653.82, "total_tokens": 21744560} +{"current_steps": 33040, "total_steps": 33920, "loss": 0.3243, "lr": 2.0535125640703813e-08, "epoch": 19.4811320754717, "percentage": 97.41, "elapsed_time": "1:04:06", "remaining_time": "0:01:42", "throughput": 5653.76, "total_tokens": 21747568} +{"current_steps": 33045, "total_steps": 33920, "loss": 0.2068, "lr": 2.0302855673066667e-08, "epoch": 19.484080188679247, "percentage": 97.42, "elapsed_time": "1:04:07", "remaining_time": "0:01:41", "throughput": 5653.69, "total_tokens": 21750224} +{"current_steps": 33050, "total_steps": 33920, "loss": 0.2446, "lr": 2.0071904101710004e-08, "epoch": 19.48702830188679, "percentage": 97.44, "elapsed_time": "1:04:08", "remaining_time": "0:01:41", "throughput": 5653.88, "total_tokens": 21756432} +{"current_steps": 33055, "total_steps": 33920, "loss": 0.2636, "lr": 1.98422709877788e-08, "epoch": 19.48997641509434, "percentage": 97.45, "elapsed_time": "1:04:08", "remaining_time": "0:01:40", "throughput": 5653.9, "total_tokens": 21759568} +{"current_steps": 33060, "total_steps": 33920, "loss": 0.3139, "lr": 1.961395639206942e-08, "epoch": 19.492924528301888, "percentage": 97.46, "elapsed_time": "1:04:09", "remaining_time": "0:01:40", "throughput": 5653.85, "total_tokens": 21762640} +{"current_steps": 33065, "total_steps": 33920, "loss": 0.2707, "lr": 1.9386960375029628e-08, "epoch": 19.495872641509433, "percentage": 97.48, "elapsed_time": "1:04:09", "remaining_time": "0:01:39", "throughput": 5653.84, "total_tokens": 21765616} +{"current_steps": 33070, "total_steps": 33920, "loss": 0.2647, "lr": 1.9161282996757458e-08, "epoch": 19.49882075471698, "percentage": 97.49, "elapsed_time": "1:04:10", "remaining_time": "0:01:38", "throughput": 5653.93, "total_tokens": 21769552} +{"current_steps": 33075, "total_steps": 33920, "loss": 0.308, "lr": 1.8936924317001225e-08, "epoch": 19.50176886792453, "percentage": 97.51, "elapsed_time": "1:04:10", "remaining_time": "0:01:38", "throughput": 5654.02, "total_tokens": 21772880} +{"current_steps": 33080, "total_steps": 33920, "loss": 0.2911, "lr": 1.8713884395162308e-08, "epoch": 19.504716981132077, "percentage": 97.52, "elapsed_time": "1:04:11", "remaining_time": "0:01:37", "throughput": 5654.06, "total_tokens": 21776208} +{"current_steps": 33085, "total_steps": 33920, "loss": 0.216, "lr": 1.8492163290290132e-08, "epoch": 19.50766509433962, "percentage": 97.54, "elapsed_time": "1:04:11", "remaining_time": "0:01:37", "throughput": 5653.92, "total_tokens": 21778608} +{"current_steps": 33090, "total_steps": 33920, "loss": 0.2731, "lr": 1.827176106108719e-08, "epoch": 19.51061320754717, "percentage": 97.55, "elapsed_time": "1:04:12", "remaining_time": "0:01:36", "throughput": 5653.82, "total_tokens": 21781264} +{"current_steps": 33095, "total_steps": 33920, "loss": 0.3999, "lr": 1.8052677765905137e-08, "epoch": 19.513561320754718, "percentage": 97.57, "elapsed_time": "1:04:13", "remaining_time": "0:01:36", "throughput": 5653.79, "total_tokens": 21784208} +{"current_steps": 33100, "total_steps": 33920, "loss": 0.3224, "lr": 1.783491346274757e-08, "epoch": 19.516509433962263, "percentage": 97.58, "elapsed_time": "1:04:13", "remaining_time": "0:01:35", "throughput": 5653.73, "total_tokens": 21787088} +{"current_steps": 33105, "total_steps": 33920, "loss": 0.2853, "lr": 1.7618468209268936e-08, "epoch": 19.51945754716981, "percentage": 97.6, "elapsed_time": "1:04:14", "remaining_time": "0:01:34", "throughput": 5653.84, "total_tokens": 21790768} +{"current_steps": 33110, "total_steps": 33920, "loss": 0.2907, "lr": 1.7403342062773943e-08, "epoch": 19.52240566037736, "percentage": 97.61, "elapsed_time": "1:04:14", "remaining_time": "0:01:34", "throughput": 5653.78, "total_tokens": 21793488} +{"current_steps": 33115, "total_steps": 33920, "loss": 0.3645, "lr": 1.718953508021759e-08, "epoch": 19.525353773584907, "percentage": 97.63, "elapsed_time": "1:04:15", "remaining_time": "0:01:33", "throughput": 5653.82, "total_tokens": 21796656} +{"current_steps": 33120, "total_steps": 33920, "loss": 0.2268, "lr": 1.6977047318206262e-08, "epoch": 19.528301886792452, "percentage": 97.64, "elapsed_time": "1:04:15", "remaining_time": "0:01:33", "throughput": 5653.78, "total_tokens": 21799600} +{"current_steps": 33125, "total_steps": 33920, "loss": 0.3875, "lr": 1.676587883299774e-08, "epoch": 19.53125, "percentage": 97.66, "elapsed_time": "1:04:16", "remaining_time": "0:01:32", "throughput": 5653.83, "total_tokens": 21802992} +{"current_steps": 33130, "total_steps": 33920, "loss": 0.2487, "lr": 1.655602968049952e-08, "epoch": 19.534198113207548, "percentage": 97.67, "elapsed_time": "1:04:16", "remaining_time": "0:01:31", "throughput": 5653.75, "total_tokens": 21805552} +{"current_steps": 33135, "total_steps": 33920, "loss": 0.5729, "lr": 1.634749991626938e-08, "epoch": 19.537146226415093, "percentage": 97.69, "elapsed_time": "1:04:17", "remaining_time": "0:01:31", "throughput": 5653.59, "total_tokens": 21807856} +{"current_steps": 33140, "total_steps": 33920, "loss": 0.2389, "lr": 1.6140289595517056e-08, "epoch": 19.54009433962264, "percentage": 97.7, "elapsed_time": "1:04:17", "remaining_time": "0:01:30", "throughput": 5653.57, "total_tokens": 21810928} +{"current_steps": 33145, "total_steps": 33920, "loss": 0.278, "lr": 1.5934398773102545e-08, "epoch": 19.54304245283019, "percentage": 97.72, "elapsed_time": "1:04:18", "remaining_time": "0:01:30", "throughput": 5653.43, "total_tokens": 21813296} +{"current_steps": 33150, "total_steps": 33920, "loss": 0.2338, "lr": 1.5729827503536133e-08, "epoch": 19.545990566037737, "percentage": 97.73, "elapsed_time": "1:04:19", "remaining_time": "0:01:29", "throughput": 5653.47, "total_tokens": 21817264} +{"current_steps": 33155, "total_steps": 33920, "loss": 0.4554, "lr": 1.5526575840978942e-08, "epoch": 19.548938679245282, "percentage": 97.74, "elapsed_time": "1:04:19", "remaining_time": "0:01:29", "throughput": 5653.4, "total_tokens": 21820048} +{"current_steps": 33160, "total_steps": 33920, "loss": 0.2952, "lr": 1.532464383924237e-08, "epoch": 19.55188679245283, "percentage": 97.76, "elapsed_time": "1:04:20", "remaining_time": "0:01:28", "throughput": 5653.5, "total_tokens": 21824112} +{"current_steps": 33165, "total_steps": 33920, "loss": 0.3902, "lr": 1.5124031551789208e-08, "epoch": 19.55483490566038, "percentage": 97.77, "elapsed_time": "1:04:20", "remaining_time": "0:01:27", "throughput": 5653.65, "total_tokens": 21828048} +{"current_steps": 33170, "total_steps": 33920, "loss": 0.4169, "lr": 1.4924739031732527e-08, "epoch": 19.557783018867923, "percentage": 97.79, "elapsed_time": "1:04:21", "remaining_time": "0:01:27", "throughput": 5653.64, "total_tokens": 21830928} +{"current_steps": 33175, "total_steps": 33920, "loss": 0.3696, "lr": 1.4726766331835118e-08, "epoch": 19.56073113207547, "percentage": 97.8, "elapsed_time": "1:04:22", "remaining_time": "0:01:26", "throughput": 5653.84, "total_tokens": 21835792} +{"current_steps": 33180, "total_steps": 33920, "loss": 0.2224, "lr": 1.4530113504512278e-08, "epoch": 19.56367924528302, "percentage": 97.82, "elapsed_time": "1:04:22", "remaining_time": "0:01:26", "throughput": 5653.76, "total_tokens": 21838544} +{"current_steps": 33185, "total_steps": 33920, "loss": 0.216, "lr": 1.4334780601827914e-08, "epoch": 19.566627358490567, "percentage": 97.83, "elapsed_time": "1:04:23", "remaining_time": "0:01:25", "throughput": 5653.84, "total_tokens": 21842096} +{"current_steps": 33190, "total_steps": 33920, "loss": 0.3483, "lr": 1.4140767675497325e-08, "epoch": 19.569575471698112, "percentage": 97.85, "elapsed_time": "1:04:23", "remaining_time": "0:01:24", "throughput": 5653.88, "total_tokens": 21845776} +{"current_steps": 33195, "total_steps": 33920, "loss": 0.3862, "lr": 1.394807477688609e-08, "epoch": 19.57252358490566, "percentage": 97.86, "elapsed_time": "1:04:24", "remaining_time": "0:01:24", "throughput": 5653.97, "total_tokens": 21849328} +{"current_steps": 33200, "total_steps": 33920, "loss": 0.2353, "lr": 1.3756701957011177e-08, "epoch": 19.57547169811321, "percentage": 97.88, "elapsed_time": "1:04:24", "remaining_time": "0:01:23", "throughput": 5654.0, "total_tokens": 21852464} +{"current_steps": 33205, "total_steps": 33920, "loss": 0.2538, "lr": 1.3566649266538723e-08, "epoch": 19.578419811320753, "percentage": 97.89, "elapsed_time": "1:04:25", "remaining_time": "0:01:23", "throughput": 5653.91, "total_tokens": 21855056} +{"current_steps": 33210, "total_steps": 33920, "loss": 0.4268, "lr": 1.3377916755786257e-08, "epoch": 19.5813679245283, "percentage": 97.91, "elapsed_time": "1:04:26", "remaining_time": "0:01:22", "throughput": 5653.95, "total_tokens": 21858512} +{"current_steps": 33215, "total_steps": 33920, "loss": 0.3171, "lr": 1.3190504474721588e-08, "epoch": 19.58431603773585, "percentage": 97.92, "elapsed_time": "1:04:26", "remaining_time": "0:01:22", "throughput": 5654.02, "total_tokens": 21862128} +{"current_steps": 33220, "total_steps": 33920, "loss": 0.2404, "lr": 1.3004412472962802e-08, "epoch": 19.587264150943398, "percentage": 97.94, "elapsed_time": "1:04:27", "remaining_time": "0:01:21", "throughput": 5654.0, "total_tokens": 21864944} +{"current_steps": 33225, "total_steps": 33920, "loss": 0.2404, "lr": 1.2819640799778266e-08, "epoch": 19.590212264150942, "percentage": 97.95, "elapsed_time": "1:04:27", "remaining_time": "0:01:20", "throughput": 5653.96, "total_tokens": 21867952} +{"current_steps": 33230, "total_steps": 33920, "loss": 0.3266, "lr": 1.2636189504087737e-08, "epoch": 19.59316037735849, "percentage": 97.97, "elapsed_time": "1:04:28", "remaining_time": "0:01:20", "throughput": 5653.84, "total_tokens": 21870352} +{"current_steps": 33235, "total_steps": 33920, "loss": 0.3808, "lr": 1.2454058634460142e-08, "epoch": 19.59610849056604, "percentage": 97.98, "elapsed_time": "1:04:28", "remaining_time": "0:01:19", "throughput": 5653.87, "total_tokens": 21873488} +{"current_steps": 33240, "total_steps": 33920, "loss": 0.2503, "lr": 1.2273248239115798e-08, "epoch": 19.599056603773583, "percentage": 98.0, "elapsed_time": "1:04:29", "remaining_time": "0:01:19", "throughput": 5653.81, "total_tokens": 21876208} +{"current_steps": 33245, "total_steps": 33920, "loss": 0.3629, "lr": 1.2093758365924746e-08, "epoch": 19.60200471698113, "percentage": 98.01, "elapsed_time": "1:04:29", "remaining_time": "0:01:18", "throughput": 5653.83, "total_tokens": 21879632} +{"current_steps": 33250, "total_steps": 33920, "loss": 0.5949, "lr": 1.1915589062408417e-08, "epoch": 19.60495283018868, "percentage": 98.02, "elapsed_time": "1:04:30", "remaining_time": "0:01:17", "throughput": 5653.81, "total_tokens": 21882576} +{"current_steps": 33255, "total_steps": 33920, "loss": 0.2428, "lr": 1.1738740375736301e-08, "epoch": 19.607900943396228, "percentage": 98.04, "elapsed_time": "1:04:30", "remaining_time": "0:01:17", "throughput": 5653.87, "total_tokens": 21885936} +{"current_steps": 33260, "total_steps": 33920, "loss": 0.2147, "lr": 1.15632123527315e-08, "epoch": 19.610849056603772, "percentage": 98.05, "elapsed_time": "1:04:31", "remaining_time": "0:01:16", "throughput": 5653.71, "total_tokens": 21888400} +{"current_steps": 33265, "total_steps": 33920, "loss": 0.2427, "lr": 1.1389005039865176e-08, "epoch": 19.61379716981132, "percentage": 98.07, "elapsed_time": "1:04:32", "remaining_time": "0:01:16", "throughput": 5653.59, "total_tokens": 21890960} +{"current_steps": 33270, "total_steps": 33920, "loss": 0.2302, "lr": 1.1216118483259875e-08, "epoch": 19.61674528301887, "percentage": 98.08, "elapsed_time": "1:04:32", "remaining_time": "0:01:15", "throughput": 5653.52, "total_tokens": 21893712} +{"current_steps": 33275, "total_steps": 33920, "loss": 0.312, "lr": 1.1044552728687319e-08, "epoch": 19.619693396226417, "percentage": 98.1, "elapsed_time": "1:04:33", "remaining_time": "0:01:15", "throughput": 5653.4, "total_tokens": 21896304} +{"current_steps": 33280, "total_steps": 33920, "loss": 0.1781, "lr": 1.0874307821570618e-08, "epoch": 19.62264150943396, "percentage": 98.11, "elapsed_time": "1:04:33", "remaining_time": "0:01:14", "throughput": 5653.45, "total_tokens": 21899504} +{"current_steps": 33285, "total_steps": 33920, "loss": 0.2039, "lr": 1.0705383806982606e-08, "epoch": 19.62558962264151, "percentage": 98.13, "elapsed_time": "1:04:34", "remaining_time": "0:01:13", "throughput": 5653.4, "total_tokens": 21902448} +{"current_steps": 33290, "total_steps": 33920, "loss": 0.3002, "lr": 1.0537780729646952e-08, "epoch": 19.628537735849058, "percentage": 98.14, "elapsed_time": "1:04:34", "remaining_time": "0:01:13", "throughput": 5653.35, "total_tokens": 21905200} +{"current_steps": 33295, "total_steps": 33920, "loss": 0.2632, "lr": 1.0371498633937605e-08, "epoch": 19.631485849056602, "percentage": 98.16, "elapsed_time": "1:04:35", "remaining_time": "0:01:12", "throughput": 5653.38, "total_tokens": 21908432} +{"current_steps": 33300, "total_steps": 33920, "loss": 0.232, "lr": 1.0206537563877683e-08, "epoch": 19.63443396226415, "percentage": 98.17, "elapsed_time": "1:04:35", "remaining_time": "0:01:12", "throughput": 5653.49, "total_tokens": 21912304} +{"current_steps": 33305, "total_steps": 33920, "loss": 0.3567, "lr": 1.0042897563141695e-08, "epoch": 19.6373820754717, "percentage": 98.19, "elapsed_time": "1:04:36", "remaining_time": "0:01:11", "throughput": 5653.53, "total_tokens": 21915408} +{"current_steps": 33310, "total_steps": 33920, "loss": 0.3008, "lr": 9.88057867505443e-09, "epoch": 19.640330188679247, "percentage": 98.2, "elapsed_time": "1:04:36", "remaining_time": "0:01:10", "throughput": 5653.48, "total_tokens": 21918288} +{"current_steps": 33315, "total_steps": 33920, "loss": 0.3639, "lr": 9.7195809425904e-09, "epoch": 19.64327830188679, "percentage": 98.22, "elapsed_time": "1:04:37", "remaining_time": "0:01:10", "throughput": 5653.58, "total_tokens": 21922480} +{"current_steps": 33320, "total_steps": 33920, "loss": 0.3291, "lr": 9.559904408373844e-09, "epoch": 19.64622641509434, "percentage": 98.23, "elapsed_time": "1:04:38", "remaining_time": "0:01:09", "throughput": 5653.52, "total_tokens": 21925136} +{"current_steps": 33325, "total_steps": 33920, "loss": 0.2658, "lr": 9.401549114680387e-09, "epoch": 19.649174528301888, "percentage": 98.25, "elapsed_time": "1:04:38", "remaining_time": "0:01:09", "throughput": 5653.66, "total_tokens": 21929296} +{"current_steps": 33330, "total_steps": 33920, "loss": 0.4028, "lr": 9.244515103434826e-09, "epoch": 19.652122641509433, "percentage": 98.26, "elapsed_time": "1:04:39", "remaining_time": "0:01:08", "throughput": 5653.55, "total_tokens": 21932048} +{"current_steps": 33335, "total_steps": 33920, "loss": 0.3923, "lr": 9.08880241621335e-09, "epoch": 19.65507075471698, "percentage": 98.28, "elapsed_time": "1:04:40", "remaining_time": "0:01:08", "throughput": 5653.93, "total_tokens": 21941648} +{"current_steps": 33340, "total_steps": 33920, "loss": 0.2242, "lr": 8.934411094240758e-09, "epoch": 19.65801886792453, "percentage": 98.29, "elapsed_time": "1:04:41", "remaining_time": "0:01:07", "throughput": 5654.01, "total_tokens": 21945680} +{"current_steps": 33345, "total_steps": 33920, "loss": 0.2329, "lr": 8.781341178393244e-09, "epoch": 19.660966981132077, "percentage": 98.3, "elapsed_time": "1:04:42", "remaining_time": "0:01:06", "throughput": 5654.2, "total_tokens": 21949936} +{"current_steps": 33350, "total_steps": 33920, "loss": 0.2693, "lr": 8.629592709196167e-09, "epoch": 19.66391509433962, "percentage": 98.32, "elapsed_time": "1:04:42", "remaining_time": "0:01:06", "throughput": 5654.19, "total_tokens": 21952944} +{"current_steps": 33355, "total_steps": 33920, "loss": 0.2872, "lr": 8.479165726826277e-09, "epoch": 19.66686320754717, "percentage": 98.33, "elapsed_time": "1:04:43", "remaining_time": "0:01:05", "throughput": 5654.13, "total_tokens": 21955632} +{"current_steps": 33360, "total_steps": 33920, "loss": 0.2962, "lr": 8.330060271109496e-09, "epoch": 19.669811320754718, "percentage": 98.35, "elapsed_time": "1:04:43", "remaining_time": "0:01:05", "throughput": 5654.22, "total_tokens": 21959088} +{"current_steps": 33365, "total_steps": 33920, "loss": 0.2854, "lr": 8.18227638152258e-09, "epoch": 19.672759433962263, "percentage": 98.36, "elapsed_time": "1:04:44", "remaining_time": "0:01:04", "throughput": 5654.29, "total_tokens": 21962544} +{"current_steps": 33370, "total_steps": 33920, "loss": 0.2024, "lr": 8.035814097191452e-09, "epoch": 19.67570754716981, "percentage": 98.38, "elapsed_time": "1:04:44", "remaining_time": "0:01:04", "throughput": 5654.29, "total_tokens": 21965808} +{"current_steps": 33375, "total_steps": 33920, "loss": 0.302, "lr": 7.890673456892317e-09, "epoch": 19.67865566037736, "percentage": 98.39, "elapsed_time": "1:04:45", "remaining_time": "0:01:03", "throughput": 5654.32, "total_tokens": 21969232} +{"current_steps": 33380, "total_steps": 33920, "loss": 0.3199, "lr": 7.746854499052215e-09, "epoch": 19.681603773584907, "percentage": 98.41, "elapsed_time": "1:04:45", "remaining_time": "0:01:02", "throughput": 5654.44, "total_tokens": 21973008} +{"current_steps": 33385, "total_steps": 33920, "loss": 0.3323, "lr": 7.604357261747907e-09, "epoch": 19.684551886792452, "percentage": 98.42, "elapsed_time": "1:04:46", "remaining_time": "0:01:02", "throughput": 5654.39, "total_tokens": 21975888} +{"current_steps": 33390, "total_steps": 33920, "loss": 0.2802, "lr": 7.463181782705886e-09, "epoch": 19.6875, "percentage": 98.44, "elapsed_time": "1:04:47", "remaining_time": "0:01:01", "throughput": 5654.38, "total_tokens": 21978960} +{"current_steps": 33395, "total_steps": 33920, "loss": 0.5767, "lr": 7.3233280993034726e-09, "epoch": 19.690448113207548, "percentage": 98.45, "elapsed_time": "1:04:47", "remaining_time": "0:01:01", "throughput": 5654.38, "total_tokens": 21982096} +{"current_steps": 33400, "total_steps": 33920, "loss": 0.2984, "lr": 7.184796248567161e-09, "epoch": 19.693396226415093, "percentage": 98.47, "elapsed_time": "1:04:48", "remaining_time": "0:01:00", "throughput": 5654.56, "total_tokens": 21986480} +{"current_steps": 33405, "total_steps": 33920, "loss": 0.1844, "lr": 7.047586267173723e-09, "epoch": 19.69634433962264, "percentage": 98.48, "elapsed_time": "1:04:48", "remaining_time": "0:00:59", "throughput": 5654.52, "total_tokens": 21989328} +{"current_steps": 33410, "total_steps": 33920, "loss": 0.3878, "lr": 6.9116981914502114e-09, "epoch": 19.69929245283019, "percentage": 98.5, "elapsed_time": "1:04:49", "remaining_time": "0:00:59", "throughput": 5654.64, "total_tokens": 21993840} +{"current_steps": 33415, "total_steps": 33920, "loss": 0.2825, "lr": 6.7771320573734036e-09, "epoch": 19.702240566037737, "percentage": 98.51, "elapsed_time": "1:04:50", "remaining_time": "0:00:58", "throughput": 5654.63, "total_tokens": 21996944} +{"current_steps": 33420, "total_steps": 33920, "loss": 0.2576, "lr": 6.6438879005709114e-09, "epoch": 19.705188679245282, "percentage": 98.53, "elapsed_time": "1:04:50", "remaining_time": "0:00:58", "throughput": 5654.71, "total_tokens": 22001392} +{"current_steps": 33425, "total_steps": 33920, "loss": 0.3424, "lr": 6.511965756318961e-09, "epoch": 19.70813679245283, "percentage": 98.54, "elapsed_time": "1:04:51", "remaining_time": "0:00:57", "throughput": 5654.62, "total_tokens": 22004336} +{"current_steps": 33430, "total_steps": 33920, "loss": 0.3734, "lr": 6.381365659545169e-09, "epoch": 19.71108490566038, "percentage": 98.56, "elapsed_time": "1:04:51", "remaining_time": "0:00:57", "throughput": 5654.48, "total_tokens": 22006768} +{"current_steps": 33435, "total_steps": 33920, "loss": 0.3722, "lr": 6.252087644825766e-09, "epoch": 19.714033018867923, "percentage": 98.57, "elapsed_time": "1:04:52", "remaining_time": "0:00:56", "throughput": 5654.51, "total_tokens": 22010160} +{"current_steps": 33440, "total_steps": 33920, "loss": 0.2388, "lr": 6.124131746388373e-09, "epoch": 19.71698113207547, "percentage": 98.58, "elapsed_time": "1:04:53", "remaining_time": "0:00:55", "throughput": 5654.59, "total_tokens": 22013648} +{"current_steps": 33445, "total_steps": 33920, "loss": 0.2748, "lr": 5.997497998109225e-09, "epoch": 19.71992924528302, "percentage": 98.6, "elapsed_time": "1:04:53", "remaining_time": "0:00:55", "throughput": 5654.51, "total_tokens": 22016240} +{"current_steps": 33450, "total_steps": 33920, "loss": 0.2211, "lr": 5.8721864335153925e-09, "epoch": 19.722877358490567, "percentage": 98.61, "elapsed_time": "1:04:54", "remaining_time": "0:00:54", "throughput": 5654.53, "total_tokens": 22019376} +{"current_steps": 33455, "total_steps": 33920, "loss": 0.2945, "lr": 5.748197085784224e-09, "epoch": 19.725825471698112, "percentage": 98.63, "elapsed_time": "1:04:54", "remaining_time": "0:00:54", "throughput": 5654.53, "total_tokens": 22022416} +{"current_steps": 33460, "total_steps": 33920, "loss": 0.216, "lr": 5.62552998774113e-09, "epoch": 19.72877358490566, "percentage": 98.64, "elapsed_time": "1:04:55", "remaining_time": "0:00:53", "throughput": 5654.58, "total_tokens": 22026064} +{"current_steps": 33465, "total_steps": 33920, "loss": 0.3391, "lr": 5.504185171864018e-09, "epoch": 19.73172169811321, "percentage": 98.66, "elapsed_time": "1:04:55", "remaining_time": "0:00:52", "throughput": 5654.55, "total_tokens": 22028816} +{"current_steps": 33470, "total_steps": 33920, "loss": 0.3647, "lr": 5.384162670278858e-09, "epoch": 19.734669811320753, "percentage": 98.67, "elapsed_time": "1:04:56", "remaining_time": "0:00:52", "throughput": 5654.59, "total_tokens": 22032432} +{"current_steps": 33475, "total_steps": 33920, "loss": 0.3746, "lr": 5.265462514762454e-09, "epoch": 19.7376179245283, "percentage": 98.69, "elapsed_time": "1:04:57", "remaining_time": "0:00:51", "throughput": 5654.64, "total_tokens": 22036528} +{"current_steps": 33480, "total_steps": 33920, "loss": 0.3347, "lr": 5.148084736740777e-09, "epoch": 19.74056603773585, "percentage": 98.7, "elapsed_time": "1:04:57", "remaining_time": "0:00:51", "throughput": 5654.62, "total_tokens": 22039632} +{"current_steps": 33485, "total_steps": 33920, "loss": 0.3137, "lr": 5.032029367290081e-09, "epoch": 19.743514150943398, "percentage": 98.72, "elapsed_time": "1:04:58", "remaining_time": "0:00:50", "throughput": 5654.57, "total_tokens": 22042672} +{"current_steps": 33490, "total_steps": 33920, "loss": 0.3739, "lr": 4.917296437136898e-09, "epoch": 19.746462264150942, "percentage": 98.73, "elapsed_time": "1:04:58", "remaining_time": "0:00:50", "throughput": 5654.65, "total_tokens": 22045968} +{"current_steps": 33495, "total_steps": 33920, "loss": 0.3236, "lr": 4.8038859766569305e-09, "epoch": 19.74941037735849, "percentage": 98.75, "elapsed_time": "1:04:59", "remaining_time": "0:00:49", "throughput": 5654.68, "total_tokens": 22049680} +{"current_steps": 33500, "total_steps": 33920, "loss": 0.2395, "lr": 4.691798015876714e-09, "epoch": 19.75235849056604, "percentage": 98.76, "elapsed_time": "1:04:59", "remaining_time": "0:00:48", "throughput": 5654.74, "total_tokens": 22053104} +{"current_steps": 33505, "total_steps": 33920, "loss": 0.2529, "lr": 4.581032584470846e-09, "epoch": 19.755306603773583, "percentage": 98.78, "elapsed_time": "1:05:00", "remaining_time": "0:00:48", "throughput": 5654.72, "total_tokens": 22056304} +{"current_steps": 33510, "total_steps": 33920, "loss": 0.3302, "lr": 4.471589711766422e-09, "epoch": 19.75825471698113, "percentage": 98.79, "elapsed_time": "1:05:01", "remaining_time": "0:00:47", "throughput": 5654.83, "total_tokens": 22060144} +{"current_steps": 33515, "total_steps": 33920, "loss": 0.2151, "lr": 4.363469426737487e-09, "epoch": 19.76120283018868, "percentage": 98.81, "elapsed_time": "1:05:01", "remaining_time": "0:00:47", "throughput": 5654.71, "total_tokens": 22062960} +{"current_steps": 33520, "total_steps": 33920, "loss": 0.2887, "lr": 4.256671758010588e-09, "epoch": 19.764150943396228, "percentage": 98.82, "elapsed_time": "1:05:02", "remaining_time": "0:00:46", "throughput": 5654.69, "total_tokens": 22065776} +{"current_steps": 33525, "total_steps": 33920, "loss": 0.2253, "lr": 4.151196733859775e-09, "epoch": 19.767099056603772, "percentage": 98.84, "elapsed_time": "1:05:02", "remaining_time": "0:00:45", "throughput": 5654.8, "total_tokens": 22070000} +{"current_steps": 33530, "total_steps": 33920, "loss": 0.24, "lr": 4.047044382211041e-09, "epoch": 19.77004716981132, "percentage": 98.85, "elapsed_time": "1:05:03", "remaining_time": "0:00:45", "throughput": 5654.84, "total_tokens": 22073264} +{"current_steps": 33535, "total_steps": 33920, "loss": 0.2669, "lr": 3.94421473063844e-09, "epoch": 19.77299528301887, "percentage": 98.86, "elapsed_time": "1:05:04", "remaining_time": "0:00:44", "throughput": 5654.81, "total_tokens": 22076368} +{"current_steps": 33540, "total_steps": 33920, "loss": 0.4777, "lr": 3.842707806366863e-09, "epoch": 19.775943396226417, "percentage": 98.88, "elapsed_time": "1:05:04", "remaining_time": "0:00:44", "throughput": 5654.82, "total_tokens": 22079632} +{"current_steps": 33545, "total_steps": 33920, "loss": 0.3285, "lr": 3.742523636270368e-09, "epoch": 19.77889150943396, "percentage": 98.89, "elapsed_time": "1:05:05", "remaining_time": "0:00:43", "throughput": 5654.8, "total_tokens": 22082512} +{"current_steps": 33550, "total_steps": 33920, "loss": 0.2789, "lr": 3.6436622468738468e-09, "epoch": 19.78183962264151, "percentage": 98.91, "elapsed_time": "1:05:05", "remaining_time": "0:00:43", "throughput": 5654.94, "total_tokens": 22086896} +{"current_steps": 33555, "total_steps": 33920, "loss": 0.3315, "lr": 3.546123664350254e-09, "epoch": 19.784787735849058, "percentage": 98.92, "elapsed_time": "1:05:06", "remaining_time": "0:00:42", "throughput": 5654.85, "total_tokens": 22089456} +{"current_steps": 33560, "total_steps": 33920, "loss": 0.248, "lr": 3.449907914524486e-09, "epoch": 19.787735849056602, "percentage": 98.94, "elapsed_time": "1:05:06", "remaining_time": "0:00:41", "throughput": 5654.85, "total_tokens": 22092496} +{"current_steps": 33565, "total_steps": 33920, "loss": 0.2253, "lr": 3.355015022869501e-09, "epoch": 19.79068396226415, "percentage": 98.95, "elapsed_time": "1:05:07", "remaining_time": "0:00:41", "throughput": 5654.77, "total_tokens": 22095216} +{"current_steps": 33570, "total_steps": 33920, "loss": 0.3973, "lr": 3.261445014508535e-09, "epoch": 19.7936320754717, "percentage": 98.97, "elapsed_time": "1:05:07", "remaining_time": "0:00:40", "throughput": 5654.64, "total_tokens": 22097872} +{"current_steps": 33575, "total_steps": 33920, "loss": 0.2419, "lr": 3.1691979142145503e-09, "epoch": 19.796580188679247, "percentage": 98.98, "elapsed_time": "1:05:08", "remaining_time": "0:00:40", "throughput": 5654.61, "total_tokens": 22100624} +{"current_steps": 33580, "total_steps": 33920, "loss": 0.3073, "lr": 3.078273746410787e-09, "epoch": 19.79952830188679, "percentage": 99.0, "elapsed_time": "1:05:09", "remaining_time": "0:00:39", "throughput": 5654.77, "total_tokens": 22105808} +{"current_steps": 33585, "total_steps": 33920, "loss": 0.426, "lr": 2.988672535169657e-09, "epoch": 19.80247641509434, "percentage": 99.01, "elapsed_time": "1:05:10", "remaining_time": "0:00:39", "throughput": 5654.85, "total_tokens": 22112336} +{"current_steps": 33590, "total_steps": 33920, "loss": 0.3055, "lr": 2.9003943042127393e-09, "epoch": 19.805424528301888, "percentage": 99.03, "elapsed_time": "1:05:10", "remaining_time": "0:00:38", "throughput": 5654.7, "total_tokens": 22114736} +{"current_steps": 33595, "total_steps": 33920, "loss": 0.2263, "lr": 2.8134390769135598e-09, "epoch": 19.808372641509433, "percentage": 99.04, "elapsed_time": "1:05:11", "remaining_time": "0:00:37", "throughput": 5654.66, "total_tokens": 22117680} +{"current_steps": 33600, "total_steps": 33920, "loss": 0.3221, "lr": 2.7278068762925935e-09, "epoch": 19.81132075471698, "percentage": 99.06, "elapsed_time": "1:05:11", "remaining_time": "0:00:37", "throughput": 5654.56, "total_tokens": 22120432} +{"current_steps": 33605, "total_steps": 33920, "loss": 0.2959, "lr": 2.6434977250217043e-09, "epoch": 19.81426886792453, "percentage": 99.07, "elapsed_time": "1:05:12", "remaining_time": "0:00:36", "throughput": 5654.6, "total_tokens": 22124080} +{"current_steps": 33610, "total_steps": 33920, "loss": 0.3205, "lr": 2.560511645422481e-09, "epoch": 19.817216981132077, "percentage": 99.09, "elapsed_time": "1:05:13", "remaining_time": "0:00:36", "throughput": 5654.56, "total_tokens": 22127184} +{"current_steps": 33615, "total_steps": 33920, "loss": 0.2803, "lr": 2.4788486594656825e-09, "epoch": 19.82016509433962, "percentage": 99.1, "elapsed_time": "1:05:13", "remaining_time": "0:00:35", "throughput": 5654.62, "total_tokens": 22130704} +{"current_steps": 33620, "total_steps": 33920, "loss": 0.3116, "lr": 2.398508788771792e-09, "epoch": 19.82311320754717, "percentage": 99.12, "elapsed_time": "1:05:14", "remaining_time": "0:00:34", "throughput": 5654.57, "total_tokens": 22133648} +{"current_steps": 33625, "total_steps": 33920, "loss": 0.3171, "lr": 2.3194920546110166e-09, "epoch": 19.826061320754718, "percentage": 99.13, "elapsed_time": "1:05:14", "remaining_time": "0:00:34", "throughput": 5654.68, "total_tokens": 22137712} +{"current_steps": 33630, "total_steps": 33920, "loss": 0.3506, "lr": 2.2417984779032896e-09, "epoch": 19.829009433962263, "percentage": 99.15, "elapsed_time": "1:05:15", "remaining_time": "0:00:33", "throughput": 5654.84, "total_tokens": 22142192} +{"current_steps": 33635, "total_steps": 33920, "loss": 0.274, "lr": 2.1654280792193782e-09, "epoch": 19.83195754716981, "percentage": 99.16, "elapsed_time": "1:05:16", "remaining_time": "0:00:33", "throughput": 5655.04, "total_tokens": 22146864} +{"current_steps": 33640, "total_steps": 33920, "loss": 0.3359, "lr": 2.0903808787769987e-09, "epoch": 19.83490566037736, "percentage": 99.17, "elapsed_time": "1:05:16", "remaining_time": "0:00:32", "throughput": 5655.15, "total_tokens": 22150704} +{"current_steps": 33645, "total_steps": 33920, "loss": 0.2749, "lr": 2.0166568964463673e-09, "epoch": 19.837853773584907, "percentage": 99.19, "elapsed_time": "1:05:17", "remaining_time": "0:00:32", "throughput": 5655.14, "total_tokens": 22153968} +{"current_steps": 33650, "total_steps": 33920, "loss": 0.254, "lr": 1.9442561517463153e-09, "epoch": 19.840801886792452, "percentage": 99.2, "elapsed_time": "1:05:18", "remaining_time": "0:00:31", "throughput": 5655.12, "total_tokens": 22157424} +{"current_steps": 33655, "total_steps": 33920, "loss": 0.2873, "lr": 1.8731786638442886e-09, "epoch": 19.84375, "percentage": 99.22, "elapsed_time": "1:05:18", "remaining_time": "0:00:30", "throughput": 5655.14, "total_tokens": 22162096} +{"current_steps": 33660, "total_steps": 33920, "loss": 0.279, "lr": 1.8034244515591214e-09, "epoch": 19.846698113207548, "percentage": 99.23, "elapsed_time": "1:05:19", "remaining_time": "0:00:30", "throughput": 5654.95, "total_tokens": 22164336} +{"current_steps": 33665, "total_steps": 33920, "loss": 0.2844, "lr": 1.7349935333582646e-09, "epoch": 19.849646226415093, "percentage": 99.25, "elapsed_time": "1:05:20", "remaining_time": "0:00:29", "throughput": 5654.98, "total_tokens": 22167536} +{"current_steps": 33670, "total_steps": 33920, "loss": 0.241, "lr": 1.6678859273594471e-09, "epoch": 19.85259433962264, "percentage": 99.26, "elapsed_time": "1:05:20", "remaining_time": "0:00:29", "throughput": 5654.89, "total_tokens": 22170096} +{"current_steps": 33675, "total_steps": 33920, "loss": 0.3039, "lr": 1.6021016513295683e-09, "epoch": 19.85554245283019, "percentage": 99.28, "elapsed_time": "1:05:21", "remaining_time": "0:00:28", "throughput": 5654.77, "total_tokens": 22172624} +{"current_steps": 33680, "total_steps": 33920, "loss": 0.2798, "lr": 1.5376407226846968e-09, "epoch": 19.858490566037737, "percentage": 99.29, "elapsed_time": "1:05:21", "remaining_time": "0:00:27", "throughput": 5654.56, "total_tokens": 22174832} +{"current_steps": 33685, "total_steps": 33920, "loss": 0.3391, "lr": 1.4745031584917357e-09, "epoch": 19.861438679245282, "percentage": 99.31, "elapsed_time": "1:05:22", "remaining_time": "0:00:27", "throughput": 5654.56, "total_tokens": 22177936} +{"current_steps": 33690, "total_steps": 33920, "loss": 0.3127, "lr": 1.4126889754667583e-09, "epoch": 19.86438679245283, "percentage": 99.32, "elapsed_time": "1:05:22", "remaining_time": "0:00:26", "throughput": 5654.67, "total_tokens": 22181648} +{"current_steps": 33695, "total_steps": 33920, "loss": 0.3793, "lr": 1.3521981899750069e-09, "epoch": 19.86733490566038, "percentage": 99.34, "elapsed_time": "1:05:23", "remaining_time": "0:00:26", "throughput": 5654.73, "total_tokens": 22185232} +{"current_steps": 33700, "total_steps": 33920, "loss": 0.1927, "lr": 1.293030818032004e-09, "epoch": 19.870283018867923, "percentage": 99.35, "elapsed_time": "1:05:23", "remaining_time": "0:00:25", "throughput": 5654.81, "total_tokens": 22188656} +{"current_steps": 33705, "total_steps": 33920, "loss": 0.1966, "lr": 1.2351868753018858e-09, "epoch": 19.87323113207547, "percentage": 99.37, "elapsed_time": "1:05:24", "remaining_time": "0:00:25", "throughput": 5654.83, "total_tokens": 22191600} +{"current_steps": 33710, "total_steps": 33920, "loss": 0.2975, "lr": 1.1786663770996242e-09, "epoch": 19.87617924528302, "percentage": 99.38, "elapsed_time": "1:05:24", "remaining_time": "0:00:24", "throughput": 5654.87, "total_tokens": 22195120} +{"current_steps": 33715, "total_steps": 33920, "loss": 0.2904, "lr": 1.1234693383893602e-09, "epoch": 19.879127358490567, "percentage": 99.4, "elapsed_time": "1:05:25", "remaining_time": "0:00:23", "throughput": 5654.95, "total_tokens": 22198928} +{"current_steps": 33720, "total_steps": 33920, "loss": 0.2771, "lr": 1.0695957737844043e-09, "epoch": 19.882075471698112, "percentage": 99.41, "elapsed_time": "1:05:26", "remaining_time": "0:00:23", "throughput": 5654.93, "total_tokens": 22201904} +{"current_steps": 33725, "total_steps": 33920, "loss": 0.4274, "lr": 1.0170456975483467e-09, "epoch": 19.88502358490566, "percentage": 99.43, "elapsed_time": "1:05:26", "remaining_time": "0:00:22", "throughput": 5654.91, "total_tokens": 22205104} +{"current_steps": 33730, "total_steps": 33920, "loss": 0.3181, "lr": 9.658191235933922e-10, "epoch": 19.88797169811321, "percentage": 99.44, "elapsed_time": "1:05:27", "remaining_time": "0:00:22", "throughput": 5654.86, "total_tokens": 22208400} +{"current_steps": 33735, "total_steps": 33920, "loss": 0.25, "lr": 9.159160654825805e-10, "epoch": 19.890919811320753, "percentage": 99.45, "elapsed_time": "1:05:27", "remaining_time": "0:00:21", "throughput": 5655.03, "total_tokens": 22212816} +{"current_steps": 33740, "total_steps": 33920, "loss": 0.3072, "lr": 8.673365364281205e-10, "epoch": 19.8938679245283, "percentage": 99.47, "elapsed_time": "1:05:28", "remaining_time": "0:00:20", "throughput": 5655.03, "total_tokens": 22215824} +{"current_steps": 33745, "total_steps": 33920, "loss": 0.1986, "lr": 8.200805492913911e-10, "epoch": 19.89681603773585, "percentage": 99.48, "elapsed_time": "1:05:29", "remaining_time": "0:00:20", "throughput": 5654.91, "total_tokens": 22218352} +{"current_steps": 33750, "total_steps": 33920, "loss": 0.2853, "lr": 7.741481165834952e-10, "epoch": 19.899764150943398, "percentage": 99.5, "elapsed_time": "1:05:29", "remaining_time": "0:00:19", "throughput": 5654.92, "total_tokens": 22222096} +{"current_steps": 33755, "total_steps": 33920, "loss": 0.2518, "lr": 7.29539250465261e-10, "epoch": 19.902712264150942, "percentage": 99.51, "elapsed_time": "1:05:30", "remaining_time": "0:00:19", "throughput": 5655.0, "total_tokens": 22225712} +{"current_steps": 33760, "total_steps": 33920, "loss": 0.2716, "lr": 6.862539627472409e-10, "epoch": 19.90566037735849, "percentage": 99.53, "elapsed_time": "1:05:30", "remaining_time": "0:00:18", "throughput": 5655.0, "total_tokens": 22228752} +{"current_steps": 33765, "total_steps": 33920, "loss": 0.4382, "lr": 6.442922648897121e-10, "epoch": 19.90860849056604, "percentage": 99.54, "elapsed_time": "1:05:31", "remaining_time": "0:00:18", "throughput": 5654.85, "total_tokens": 22231088} +{"current_steps": 33770, "total_steps": 33920, "loss": 0.3201, "lr": 6.036541680015662e-10, "epoch": 19.911556603773583, "percentage": 99.56, "elapsed_time": "1:05:31", "remaining_time": "0:00:17", "throughput": 5654.73, "total_tokens": 22233552} +{"current_steps": 33775, "total_steps": 33920, "loss": 0.2174, "lr": 5.643396828419745e-10, "epoch": 19.91450471698113, "percentage": 99.57, "elapsed_time": "1:05:32", "remaining_time": "0:00:16", "throughput": 5654.75, "total_tokens": 22236752} +{"current_steps": 33780, "total_steps": 33920, "loss": 0.2702, "lr": 5.26348819819833e-10, "epoch": 19.91745283018868, "percentage": 99.59, "elapsed_time": "1:05:32", "remaining_time": "0:00:16", "throughput": 5654.84, "total_tokens": 22240272} +{"current_steps": 33785, "total_steps": 33920, "loss": 0.2708, "lr": 4.896815889937622e-10, "epoch": 19.920400943396228, "percentage": 99.6, "elapsed_time": "1:05:33", "remaining_time": "0:00:15", "throughput": 5654.89, "total_tokens": 22243504} +{"current_steps": 33790, "total_steps": 33920, "loss": 0.3351, "lr": 4.543380000704423e-10, "epoch": 19.923349056603772, "percentage": 99.62, "elapsed_time": "1:05:34", "remaining_time": "0:00:15", "throughput": 5654.98, "total_tokens": 22247056} +{"current_steps": 33795, "total_steps": 33920, "loss": 0.3012, "lr": 4.203180624084979e-10, "epoch": 19.92629716981132, "percentage": 99.63, "elapsed_time": "1:05:34", "remaining_time": "0:00:14", "throughput": 5654.86, "total_tokens": 22249616} +{"current_steps": 33800, "total_steps": 33920, "loss": 0.2986, "lr": 3.876217850146136e-10, "epoch": 19.92924528301887, "percentage": 99.65, "elapsed_time": "1:05:35", "remaining_time": "0:00:13", "throughput": 5654.83, "total_tokens": 22252496} +{"current_steps": 33805, "total_steps": 33920, "loss": 0.3177, "lr": 3.56249176544643e-10, "epoch": 19.932193396226417, "percentage": 99.66, "elapsed_time": "1:05:35", "remaining_time": "0:00:13", "throughput": 5654.88, "total_tokens": 22255792} +{"current_steps": 33810, "total_steps": 33920, "loss": 0.26, "lr": 3.262002453047197e-10, "epoch": 19.93514150943396, "percentage": 99.68, "elapsed_time": "1:05:36", "remaining_time": "0:00:12", "throughput": 5654.81, "total_tokens": 22258576} +{"current_steps": 33815, "total_steps": 33920, "loss": 0.3009, "lr": 2.974749992512571e-10, "epoch": 19.93808962264151, "percentage": 99.69, "elapsed_time": "1:05:36", "remaining_time": "0:00:12", "throughput": 5654.66, "total_tokens": 22261328} +{"current_steps": 33820, "total_steps": 33920, "loss": 0.3519, "lr": 2.700734459881726e-10, "epoch": 19.941037735849058, "percentage": 99.71, "elapsed_time": "1:05:37", "remaining_time": "0:00:11", "throughput": 5654.61, "total_tokens": 22264112} +{"current_steps": 33825, "total_steps": 33920, "loss": 0.5742, "lr": 2.439955927713289e-10, "epoch": 19.943985849056602, "percentage": 99.72, "elapsed_time": "1:05:37", "remaining_time": "0:00:11", "throughput": 5654.73, "total_tokens": 22268176} +{"current_steps": 33830, "total_steps": 33920, "loss": 0.2232, "lr": 2.1924144650409263e-10, "epoch": 19.94693396226415, "percentage": 99.73, "elapsed_time": "1:05:38", "remaining_time": "0:00:10", "throughput": 5654.63, "total_tokens": 22271120} +{"current_steps": 33835, "total_steps": 33920, "loss": 0.2776, "lr": 1.9581101374066546e-10, "epoch": 19.9498820754717, "percentage": 99.75, "elapsed_time": "1:05:39", "remaining_time": "0:00:09", "throughput": 5654.47, "total_tokens": 22273424} +{"current_steps": 33840, "total_steps": 33920, "loss": 0.2911, "lr": 1.7370430068441858e-10, "epoch": 19.952830188679247, "percentage": 99.76, "elapsed_time": "1:05:39", "remaining_time": "0:00:09", "throughput": 5654.53, "total_tokens": 22276816} +{"current_steps": 33845, "total_steps": 33920, "loss": 0.4486, "lr": 1.529213131878926e-10, "epoch": 19.95577830188679, "percentage": 99.78, "elapsed_time": "1:05:40", "remaining_time": "0:00:08", "throughput": 5654.57, "total_tokens": 22280016} +{"current_steps": 33850, "total_steps": 33920, "loss": 0.4143, "lr": 1.3346205675335288e-10, "epoch": 19.95872641509434, "percentage": 99.79, "elapsed_time": "1:05:40", "remaining_time": "0:00:08", "throughput": 5654.6, "total_tokens": 22283408} +{"current_steps": 33855, "total_steps": 33920, "loss": 0.2756, "lr": 1.1532653653334447e-10, "epoch": 19.961674528301888, "percentage": 99.81, "elapsed_time": "1:05:41", "remaining_time": "0:00:07", "throughput": 5654.51, "total_tokens": 22286032} +{"current_steps": 33860, "total_steps": 33920, "loss": 0.3083, "lr": 9.85147573284717e-11, "epoch": 19.964622641509433, "percentage": 99.82, "elapsed_time": "1:05:41", "remaining_time": "0:00:06", "throughput": 5654.56, "total_tokens": 22289744} +{"current_steps": 33865, "total_steps": 33920, "loss": 0.2281, "lr": 8.302672359072894e-11, "epoch": 19.96757075471698, "percentage": 99.84, "elapsed_time": "1:05:42", "remaining_time": "0:00:06", "throughput": 5654.53, "total_tokens": 22292656} +{"current_steps": 33870, "total_steps": 33920, "loss": 0.2721, "lr": 6.886243941961468e-11, "epoch": 19.97051886792453, "percentage": 99.85, "elapsed_time": "1:05:42", "remaining_time": "0:00:05", "throughput": 5654.51, "total_tokens": 22295472} +{"current_steps": 33875, "total_steps": 33920, "loss": 0.2705, "lr": 5.602190856601741e-11, "epoch": 19.973466981132077, "percentage": 99.87, "elapsed_time": "1:05:43", "remaining_time": "0:00:05", "throughput": 5654.54, "total_tokens": 22299216} +{"current_steps": 33880, "total_steps": 33920, "loss": 0.3063, "lr": 4.450513442888493e-11, "epoch": 19.97641509433962, "percentage": 99.88, "elapsed_time": "1:05:44", "remaining_time": "0:00:04", "throughput": 5654.58, "total_tokens": 22302512} +{"current_steps": 33885, "total_steps": 33920, "loss": 0.3465, "lr": 3.4312120057999886e-11, "epoch": 19.97936320754717, "percentage": 99.9, "elapsed_time": "1:05:44", "remaining_time": "0:00:04", "throughput": 5654.46, "total_tokens": 22305008} +{"current_steps": 33890, "total_steps": 33920, "loss": 0.3758, "lr": 2.5442868151204224e-11, "epoch": 19.982311320754718, "percentage": 99.91, "elapsed_time": "1:05:45", "remaining_time": "0:00:03", "throughput": 5654.43, "total_tokens": 22308336} +{"current_steps": 33895, "total_steps": 33920, "loss": 0.2291, "lr": 1.7897381057729867e-11, "epoch": 19.985259433962263, "percentage": 99.93, "elapsed_time": "1:05:45", "remaining_time": "0:00:02", "throughput": 5654.34, "total_tokens": 22311120} +{"current_steps": 33900, "total_steps": 33920, "loss": 0.238, "lr": 1.1675660773757813e-11, "epoch": 19.98820754716981, "percentage": 99.94, "elapsed_time": "1:05:46", "remaining_time": "0:00:02", "throughput": 5654.23, "total_tokens": 22313840} +{"current_steps": 33905, "total_steps": 33920, "loss": 0.2988, "lr": 6.777708947969253e-12, "epoch": 19.99115566037736, "percentage": 99.96, "elapsed_time": "1:05:46", "remaining_time": "0:00:01", "throughput": 5654.2, "total_tokens": 22317104} +{"current_steps": 33910, "total_steps": 33920, "loss": 0.3082, "lr": 3.2035268765495674e-12, "epoch": 19.994103773584907, "percentage": 99.97, "elapsed_time": "1:05:47", "remaining_time": "0:00:01", "throughput": 5654.37, "total_tokens": 22321392} +{"current_steps": 33915, "total_steps": 33920, "loss": 0.3209, "lr": 9.531155059638863e-13, "epoch": 19.997051886792452, "percentage": 99.99, "elapsed_time": "1:05:48", "remaining_time": "0:00:00", "throughput": 5654.33, "total_tokens": 22324176} +{"current_steps": 33920, "total_steps": 33920, "loss": 0.3651, "lr": 2.6475431291750342e-14, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "1:05:48", "remaining_time": "0:00:00", "throughput": 5653.98, "total_tokens": 22326528} +{"current_steps": 33920, "total_steps": 33920, "eval_loss": 0.6114597916603088, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "1:06:07", "remaining_time": "0:00:00", "throughput": 5627.39, "total_tokens": 22326528} +{"current_steps": 33920, "total_steps": 33920, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "1:06:10", "remaining_time": "0:00:00", "throughput": 5623.04, "total_tokens": 22326528}