diff --git "a/trainer_log.jsonl" "b/trainer_log.jsonl" new file mode 100644--- /dev/null +++ "b/trainer_log.jsonl" @@ -0,0 +1,1800 @@ +{"current_steps": 5, "total_steps": 179580, "loss": 0.8318, "lr": 1.1137097672346587e-08, "epoch": 0.0005568548836173293, "percentage": 0.0, "elapsed_time": "0:00:02", "remaining_time": "21:26:13", "throughput": 2591.21, "total_tokens": 5568} +{"current_steps": 10, "total_steps": 179580, "loss": 1.1354, "lr": 2.505846976277982e-08, "epoch": 0.0011137097672346587, "percentage": 0.01, "elapsed_time": "0:00:03", "remaining_time": "19:57:05", "throughput": 2928.09, "total_tokens": 11712} +{"current_steps": 15, "total_steps": 179580, "loss": 1.1161, "lr": 3.897984185321305e-08, "epoch": 0.001670564650851988, "percentage": 0.01, "elapsed_time": "0:00:05", "remaining_time": "19:14:05", "throughput": 3037.13, "total_tokens": 17568} +{"current_steps": 20, "total_steps": 179580, "loss": 1.1547, "lr": 5.290121394364629e-08, "epoch": 0.0022274195344693173, "percentage": 0.01, "elapsed_time": "0:00:07", "remaining_time": "19:08:21", "throughput": 3118.89, "total_tokens": 23936} +{"current_steps": 25, "total_steps": 179580, "loss": 1.0458, "lr": 6.682258603407952e-08, "epoch": 0.0027842744180866467, "percentage": 0.01, "elapsed_time": "0:00:09", "remaining_time": "18:43:47", "throughput": 3152.91, "total_tokens": 29600} +{"current_steps": 30, "total_steps": 179580, "loss": 1.1183, "lr": 8.074395812451275e-08, "epoch": 0.003341129301703976, "percentage": 0.02, "elapsed_time": "0:00:11", "remaining_time": "18:42:44", "throughput": 3189.88, "total_tokens": 35904} +{"current_steps": 35, "total_steps": 179580, "loss": 1.3308, "lr": 9.466533021494599e-08, "epoch": 0.0038979841853213053, "percentage": 0.02, "elapsed_time": "0:00:13", "remaining_time": "18:33:30", "throughput": 3208.9, "total_tokens": 41792} +{"current_steps": 40, "total_steps": 179580, "loss": 1.1197, "lr": 1.0858670230537921e-07, "epoch": 0.004454839068938635, "percentage": 0.02, "elapsed_time": "0:00:14", "remaining_time": "18:35:55", "throughput": 3230.66, "total_tokens": 48192} +{"current_steps": 45, "total_steps": 179580, "loss": 1.1992, "lr": 1.2250807439581244e-07, "epoch": 0.005011693952555964, "percentage": 0.03, "elapsed_time": "0:00:16", "remaining_time": "18:38:01", "throughput": 3248.77, "total_tokens": 54624} +{"current_steps": 50, "total_steps": 179580, "loss": 1.0876, "lr": 1.3642944648624568e-07, "epoch": 0.005568548836173293, "percentage": 0.03, "elapsed_time": "0:00:18", "remaining_time": "18:40:01", "throughput": 3263.95, "total_tokens": 61088} +{"current_steps": 55, "total_steps": 179580, "loss": 0.9748, "lr": 1.5035081857667893e-07, "epoch": 0.006125403719790623, "percentage": 0.03, "elapsed_time": "0:00:20", "remaining_time": "18:28:49", "throughput": 3268.73, "total_tokens": 66624} +{"current_steps": 60, "total_steps": 179580, "loss": 1.1689, "lr": 1.6427219066711214e-07, "epoch": 0.006682258603407952, "percentage": 0.03, "elapsed_time": "0:00:22", "remaining_time": "18:25:14", "throughput": 3277.42, "total_tokens": 72640} +{"current_steps": 65, "total_steps": 179580, "loss": 1.0467, "lr": 1.7819356275754539e-07, "epoch": 0.007239113487025281, "percentage": 0.04, "elapsed_time": "0:00:24", "remaining_time": "18:25:57", "throughput": 3282.94, "total_tokens": 78880} +{"current_steps": 70, "total_steps": 179580, "loss": 0.9806, "lr": 1.9211493484797863e-07, "epoch": 0.007795968370642611, "percentage": 0.04, "elapsed_time": "0:00:25", "remaining_time": "18:26:24", "throughput": 3286.95, "total_tokens": 85088} +{"current_steps": 75, "total_steps": 179580, "loss": 0.8412, "lr": 2.0603630693841187e-07, "epoch": 0.00835282325425994, "percentage": 0.04, "elapsed_time": "0:00:27", "remaining_time": "18:27:06", "throughput": 3292.92, "total_tokens": 91392} +{"current_steps": 80, "total_steps": 179580, "loss": 1.1276, "lr": 2.1995767902884511e-07, "epoch": 0.00890967813787727, "percentage": 0.04, "elapsed_time": "0:00:29", "remaining_time": "18:25:27", "throughput": 3297.3, "total_tokens": 97472} +{"current_steps": 85, "total_steps": 179580, "loss": 1.2278, "lr": 2.3387905111927833e-07, "epoch": 0.009466533021494599, "percentage": 0.05, "elapsed_time": "0:00:31", "remaining_time": "18:26:23", "throughput": 3303.25, "total_tokens": 103840} +{"current_steps": 90, "total_steps": 179580, "loss": 1.0851, "lr": 2.478004232097116e-07, "epoch": 0.010023387905111928, "percentage": 0.05, "elapsed_time": "0:00:33", "remaining_time": "18:25:48", "throughput": 3305.93, "total_tokens": 109984} +{"current_steps": 95, "total_steps": 179580, "loss": 1.0056, "lr": 2.617217953001448e-07, "epoch": 0.010580242788729257, "percentage": 0.05, "elapsed_time": "0:00:35", "remaining_time": "18:24:19", "throughput": 3307.59, "total_tokens": 116000} +{"current_steps": 100, "total_steps": 179580, "loss": 0.9123, "lr": 2.7564316739057806e-07, "epoch": 0.011137097672346587, "percentage": 0.06, "elapsed_time": "0:00:36", "remaining_time": "18:20:02", "throughput": 3308.37, "total_tokens": 121664} +{"current_steps": 105, "total_steps": 179580, "loss": 1.1836, "lr": 2.895645394810113e-07, "epoch": 0.011693952555963916, "percentage": 0.06, "elapsed_time": "0:00:38", "remaining_time": "18:21:40", "throughput": 3312.43, "total_tokens": 128096} +{"current_steps": 110, "total_steps": 179580, "loss": 0.9849, "lr": 3.034859115714445e-07, "epoch": 0.012250807439581245, "percentage": 0.06, "elapsed_time": "0:00:40", "remaining_time": "18:19:32", "throughput": 3312.72, "total_tokens": 133952} +{"current_steps": 115, "total_steps": 179580, "loss": 1.0337, "lr": 3.1740728366187776e-07, "epoch": 0.012807662323198575, "percentage": 0.06, "elapsed_time": "0:00:42", "remaining_time": "18:20:05", "throughput": 3314.56, "total_tokens": 140192} +{"current_steps": 120, "total_steps": 179580, "loss": 1.0193, "lr": 3.31328655752311e-07, "epoch": 0.013364517206815904, "percentage": 0.07, "elapsed_time": "0:00:44", "remaining_time": "18:20:20", "throughput": 3319.18, "total_tokens": 146528} +{"current_steps": 125, "total_steps": 179580, "loss": 1.0821, "lr": 3.452500278427442e-07, "epoch": 0.013921372090433233, "percentage": 0.07, "elapsed_time": "0:00:45", "remaining_time": "18:17:51", "throughput": 3316.96, "total_tokens": 152192} +{"current_steps": 130, "total_steps": 179580, "loss": 1.0408, "lr": 3.5917139993317747e-07, "epoch": 0.014478226974050563, "percentage": 0.07, "elapsed_time": "0:00:47", "remaining_time": "18:18:27", "throughput": 3318.26, "total_tokens": 158432} +{"current_steps": 135, "total_steps": 179580, "loss": 1.0441, "lr": 3.730927720236107e-07, "epoch": 0.015035081857667892, "percentage": 0.08, "elapsed_time": "0:00:49", "remaining_time": "18:17:55", "throughput": 3317.54, "total_tokens": 164416} +{"current_steps": 140, "total_steps": 179580, "loss": 1.2402, "lr": 3.870141441140439e-07, "epoch": 0.015591936741285221, "percentage": 0.08, "elapsed_time": "0:00:51", "remaining_time": "18:17:59", "throughput": 3319.58, "total_tokens": 170624} +{"current_steps": 145, "total_steps": 179580, "loss": 1.2169, "lr": 4.009355162044771e-07, "epoch": 0.01614879162490255, "percentage": 0.08, "elapsed_time": "0:00:53", "remaining_time": "18:17:17", "throughput": 3320.13, "total_tokens": 176640} +{"current_steps": 150, "total_steps": 179580, "loss": 1.0648, "lr": 4.148568882949104e-07, "epoch": 0.01670564650851988, "percentage": 0.08, "elapsed_time": "0:00:54", "remaining_time": "18:16:01", "throughput": 3320.76, "total_tokens": 182560} +{"current_steps": 155, "total_steps": 179580, "loss": 1.1075, "lr": 4.2877826038534355e-07, "epoch": 0.017262501392137208, "percentage": 0.09, "elapsed_time": "0:00:56", "remaining_time": "18:17:03", "throughput": 3320.84, "total_tokens": 188832} +{"current_steps": 160, "total_steps": 179580, "loss": 1.0564, "lr": 4.4269963247577687e-07, "epoch": 0.01781935627575454, "percentage": 0.09, "elapsed_time": "0:00:58", "remaining_time": "18:17:38", "throughput": 3322.05, "total_tokens": 195104} +{"current_steps": 165, "total_steps": 179580, "loss": 1.1325, "lr": 4.5662100456621004e-07, "epoch": 0.018376211159371866, "percentage": 0.09, "elapsed_time": "0:01:00", "remaining_time": "18:16:26", "throughput": 3323.16, "total_tokens": 201056} +{"current_steps": 170, "total_steps": 179580, "loss": 0.9384, "lr": 4.705423766566433e-07, "epoch": 0.018933066042989197, "percentage": 0.09, "elapsed_time": "0:01:02", "remaining_time": "18:16:01", "throughput": 3324.69, "total_tokens": 207168} +{"current_steps": 175, "total_steps": 179580, "loss": 0.9964, "lr": 4.844637487470765e-07, "epoch": 0.019489920926606525, "percentage": 0.1, "elapsed_time": "0:01:04", "remaining_time": "18:16:28", "throughput": 3325.52, "total_tokens": 213408} +{"current_steps": 180, "total_steps": 179580, "loss": 1.0757, "lr": 4.983851208375097e-07, "epoch": 0.020046775810223856, "percentage": 0.1, "elapsed_time": "0:01:06", "remaining_time": "18:16:27", "throughput": 3326.63, "total_tokens": 219584} +{"current_steps": 185, "total_steps": 179580, "loss": 1.3252, "lr": 5.12306492927943e-07, "epoch": 0.020603630693841184, "percentage": 0.1, "elapsed_time": "0:01:07", "remaining_time": "18:15:55", "throughput": 3326.96, "total_tokens": 225600} +{"current_steps": 190, "total_steps": 179580, "loss": 1.1059, "lr": 5.262278650183763e-07, "epoch": 0.021160485577458515, "percentage": 0.11, "elapsed_time": "0:01:09", "remaining_time": "18:17:18", "throughput": 3328.37, "total_tokens": 232096} +{"current_steps": 195, "total_steps": 179580, "loss": 1.071, "lr": 5.401492371088094e-07, "epoch": 0.021717340461075842, "percentage": 0.11, "elapsed_time": "0:01:11", "remaining_time": "18:18:05", "throughput": 3329.09, "total_tokens": 238432} +{"current_steps": 200, "total_steps": 179580, "loss": 1.1545, "lr": 5.540706091992427e-07, "epoch": 0.022274195344693173, "percentage": 0.11, "elapsed_time": "0:01:13", "remaining_time": "18:18:04", "throughput": 3330.35, "total_tokens": 244640} +{"current_steps": 205, "total_steps": 179580, "loss": 0.9725, "lr": 5.679919812896759e-07, "epoch": 0.0228310502283105, "percentage": 0.11, "elapsed_time": "0:01:15", "remaining_time": "18:16:48", "throughput": 3331.05, "total_tokens": 250528} +{"current_steps": 210, "total_steps": 179580, "loss": 1.092, "lr": 5.819133533801091e-07, "epoch": 0.023387905111927832, "percentage": 0.12, "elapsed_time": "0:01:17", "remaining_time": "18:17:41", "throughput": 3332.43, "total_tokens": 256960} +{"current_steps": 215, "total_steps": 179580, "loss": 1.2164, "lr": 5.958347254705424e-07, "epoch": 0.02394475999554516, "percentage": 0.12, "elapsed_time": "0:01:18", "remaining_time": "18:18:16", "throughput": 3332.11, "total_tokens": 263200} +{"current_steps": 220, "total_steps": 179580, "loss": 0.9382, "lr": 6.097560975609757e-07, "epoch": 0.02450161487916249, "percentage": 0.12, "elapsed_time": "0:01:20", "remaining_time": "18:18:37", "throughput": 3332.46, "total_tokens": 269440} +{"current_steps": 225, "total_steps": 179580, "loss": 1.2335, "lr": 6.236774696514088e-07, "epoch": 0.02505846976277982, "percentage": 0.13, "elapsed_time": "0:01:22", "remaining_time": "18:18:05", "throughput": 3332.27, "total_tokens": 275424} +{"current_steps": 230, "total_steps": 179580, "loss": 0.954, "lr": 6.375988417418421e-07, "epoch": 0.02561532464639715, "percentage": 0.13, "elapsed_time": "0:01:24", "remaining_time": "18:18:53", "throughput": 3333.82, "total_tokens": 281888} +{"current_steps": 235, "total_steps": 179580, "loss": 1.1002, "lr": 6.515202138322753e-07, "epoch": 0.026172179530014477, "percentage": 0.13, "elapsed_time": "0:01:26", "remaining_time": "18:16:22", "throughput": 3333.03, "total_tokens": 287296} +{"current_steps": 240, "total_steps": 179580, "loss": 1.0977, "lr": 6.654415859227086e-07, "epoch": 0.026729034413631808, "percentage": 0.13, "elapsed_time": "0:01:28", "remaining_time": "18:16:58", "throughput": 3333.31, "total_tokens": 293600} +{"current_steps": 245, "total_steps": 179580, "loss": 0.9896, "lr": 6.793629580131418e-07, "epoch": 0.027285889297249136, "percentage": 0.14, "elapsed_time": "0:01:29", "remaining_time": "18:16:58", "throughput": 3333.87, "total_tokens": 299776} +{"current_steps": 250, "total_steps": 179580, "loss": 1.1586, "lr": 6.932843301035751e-07, "epoch": 0.027842744180866467, "percentage": 0.14, "elapsed_time": "0:01:31", "remaining_time": "18:17:19", "throughput": 3334.73, "total_tokens": 306080} +{"current_steps": 255, "total_steps": 179580, "loss": 1.0317, "lr": 7.072057021940083e-07, "epoch": 0.028399599064483794, "percentage": 0.14, "elapsed_time": "0:01:33", "remaining_time": "18:16:29", "throughput": 3334.68, "total_tokens": 311968} +{"current_steps": 260, "total_steps": 179580, "loss": 0.9848, "lr": 7.211270742844415e-07, "epoch": 0.028956453948101125, "percentage": 0.14, "elapsed_time": "0:01:35", "remaining_time": "18:16:57", "throughput": 3336.11, "total_tokens": 318368} +{"current_steps": 265, "total_steps": 179580, "loss": 0.9667, "lr": 7.350484463748747e-07, "epoch": 0.029513308831718453, "percentage": 0.15, "elapsed_time": "0:01:37", "remaining_time": "18:17:19", "throughput": 3336.79, "total_tokens": 324672} +{"current_steps": 270, "total_steps": 179580, "loss": 1.0205, "lr": 7.48969818465308e-07, "epoch": 0.030070163715335784, "percentage": 0.15, "elapsed_time": "0:01:39", "remaining_time": "18:15:53", "throughput": 3336.38, "total_tokens": 330336} +{"current_steps": 275, "total_steps": 179580, "loss": 1.3045, "lr": 7.628911905557412e-07, "epoch": 0.03062701859895311, "percentage": 0.15, "elapsed_time": "0:01:40", "remaining_time": "18:15:07", "throughput": 3335.1, "total_tokens": 336096} +{"current_steps": 280, "total_steps": 179580, "loss": 1.1382, "lr": 7.768125626461745e-07, "epoch": 0.031183873482570443, "percentage": 0.16, "elapsed_time": "0:01:42", "remaining_time": "18:15:45", "throughput": 3336.18, "total_tokens": 342528} +{"current_steps": 285, "total_steps": 179580, "loss": 1.0932, "lr": 7.907339347366077e-07, "epoch": 0.03174072836618777, "percentage": 0.16, "elapsed_time": "0:01:44", "remaining_time": "18:15:55", "throughput": 3336.15, "total_tokens": 348704} +{"current_steps": 290, "total_steps": 179580, "loss": 1.2194, "lr": 8.046553068270408e-07, "epoch": 0.0322975832498051, "percentage": 0.16, "elapsed_time": "0:01:46", "remaining_time": "18:15:32", "throughput": 3336.29, "total_tokens": 354720} +{"current_steps": 295, "total_steps": 179580, "loss": 1.1577, "lr": 8.185766789174742e-07, "epoch": 0.03285443813342243, "percentage": 0.16, "elapsed_time": "0:01:48", "remaining_time": "18:16:20", "throughput": 3336.66, "total_tokens": 361152} +{"current_steps": 300, "total_steps": 179580, "loss": 0.9648, "lr": 8.324980510079074e-07, "epoch": 0.03341129301703976, "percentage": 0.17, "elapsed_time": "0:01:50", "remaining_time": "18:15:55", "throughput": 3336.33, "total_tokens": 367104} +{"current_steps": 305, "total_steps": 179580, "loss": 1.2782, "lr": 8.464194230983406e-07, "epoch": 0.03396814790065709, "percentage": 0.17, "elapsed_time": "0:01:51", "remaining_time": "18:16:25", "throughput": 3336.63, "total_tokens": 373440} +{"current_steps": 310, "total_steps": 179580, "loss": 0.9992, "lr": 8.603407951887738e-07, "epoch": 0.034525002784274415, "percentage": 0.17, "elapsed_time": "0:01:53", "remaining_time": "18:16:13", "throughput": 3337.36, "total_tokens": 379584} +{"current_steps": 315, "total_steps": 179580, "loss": 1.1739, "lr": 8.742621672792072e-07, "epoch": 0.03508185766789175, "percentage": 0.18, "elapsed_time": "0:01:55", "remaining_time": "18:16:34", "throughput": 3338.32, "total_tokens": 385952} +{"current_steps": 320, "total_steps": 179580, "loss": 1.3828, "lr": 8.881835393696403e-07, "epoch": 0.03563871255150908, "percentage": 0.18, "elapsed_time": "0:01:57", "remaining_time": "18:16:18", "throughput": 3338.66, "total_tokens": 392032} +{"current_steps": 325, "total_steps": 179580, "loss": 0.9624, "lr": 9.021049114600735e-07, "epoch": 0.036195567435126405, "percentage": 0.18, "elapsed_time": "0:01:59", "remaining_time": "18:16:31", "throughput": 3339.11, "total_tokens": 398304} +{"current_steps": 330, "total_steps": 179580, "loss": 0.9696, "lr": 9.160262835505068e-07, "epoch": 0.03675242231874373, "percentage": 0.18, "elapsed_time": "0:02:01", "remaining_time": "18:15:39", "throughput": 3339.17, "total_tokens": 404128} +{"current_steps": 335, "total_steps": 179580, "loss": 0.9918, "lr": 9.2994765564094e-07, "epoch": 0.03730927720236107, "percentage": 0.19, "elapsed_time": "0:02:02", "remaining_time": "18:15:35", "throughput": 3339.21, "total_tokens": 410240} +{"current_steps": 340, "total_steps": 179580, "loss": 0.8052, "lr": 9.438690277313733e-07, "epoch": 0.037866132085978395, "percentage": 0.19, "elapsed_time": "0:02:04", "remaining_time": "18:15:49", "throughput": 3339.3, "total_tokens": 416480} +{"current_steps": 345, "total_steps": 179580, "loss": 1.2185, "lr": 9.577903998218064e-07, "epoch": 0.03842298696959572, "percentage": 0.19, "elapsed_time": "0:02:06", "remaining_time": "18:15:33", "throughput": 3339.44, "total_tokens": 422528} +{"current_steps": 350, "total_steps": 179580, "loss": 1.1212, "lr": 9.717117719122396e-07, "epoch": 0.03897984185321305, "percentage": 0.19, "elapsed_time": "0:02:08", "remaining_time": "18:14:46", "throughput": 3338.88, "total_tokens": 428288} +{"current_steps": 355, "total_steps": 179580, "loss": 1.1558, "lr": 9.856331440026731e-07, "epoch": 0.039536696736830385, "percentage": 0.2, "elapsed_time": "0:02:10", "remaining_time": "18:15:18", "throughput": 3339.33, "total_tokens": 434688} +{"current_steps": 360, "total_steps": 179580, "loss": 1.1384, "lr": 9.995545160931062e-07, "epoch": 0.04009355162044771, "percentage": 0.2, "elapsed_time": "0:02:11", "remaining_time": "18:15:08", "throughput": 3338.69, "total_tokens": 440672} +{"current_steps": 365, "total_steps": 179580, "loss": 0.9096, "lr": 1.0134758881835394e-06, "epoch": 0.04065040650406504, "percentage": 0.2, "elapsed_time": "0:02:13", "remaining_time": "18:15:06", "throughput": 3338.88, "total_tokens": 446816} +{"current_steps": 370, "total_steps": 179580, "loss": 1.0531, "lr": 1.0273972602739725e-06, "epoch": 0.04120726138768237, "percentage": 0.21, "elapsed_time": "0:02:15", "remaining_time": "18:14:52", "throughput": 3339.19, "total_tokens": 452896} +{"current_steps": 375, "total_steps": 179580, "loss": 1.0353, "lr": 1.041318632364406e-06, "epoch": 0.0417641162712997, "percentage": 0.21, "elapsed_time": "0:02:17", "remaining_time": "18:14:54", "throughput": 3339.67, "total_tokens": 459104} +{"current_steps": 380, "total_steps": 179580, "loss": 1.2786, "lr": 1.0552400044548393e-06, "epoch": 0.04232097115491703, "percentage": 0.21, "elapsed_time": "0:02:19", "remaining_time": "18:15:08", "throughput": 3339.93, "total_tokens": 465376} +{"current_steps": 385, "total_steps": 179580, "loss": 0.9737, "lr": 1.0691613765452723e-06, "epoch": 0.04287782603853436, "percentage": 0.21, "elapsed_time": "0:02:21", "remaining_time": "18:15:05", "throughput": 3339.69, "total_tokens": 471456} +{"current_steps": 390, "total_steps": 179580, "loss": 1.0758, "lr": 1.0830827486357056e-06, "epoch": 0.043434680922151685, "percentage": 0.22, "elapsed_time": "0:02:22", "remaining_time": "18:15:02", "throughput": 3339.89, "total_tokens": 477600} +{"current_steps": 395, "total_steps": 179580, "loss": 1.1186, "lr": 1.0970041207261389e-06, "epoch": 0.04399153580576902, "percentage": 0.22, "elapsed_time": "0:02:24", "remaining_time": "18:14:22", "throughput": 3340.2, "total_tokens": 483488} +{"current_steps": 400, "total_steps": 179580, "loss": 1.0204, "lr": 1.1109254928165721e-06, "epoch": 0.04454839068938635, "percentage": 0.22, "elapsed_time": "0:02:26", "remaining_time": "18:14:22", "throughput": 3340.29, "total_tokens": 489632} +{"current_steps": 405, "total_steps": 179580, "loss": 1.1879, "lr": 1.1248468649070052e-06, "epoch": 0.045105245573003674, "percentage": 0.23, "elapsed_time": "0:02:28", "remaining_time": "18:14:20", "throughput": 3340.2, "total_tokens": 495744} +{"current_steps": 410, "total_steps": 179580, "loss": 1.1631, "lr": 1.1387682369974384e-06, "epoch": 0.045662100456621, "percentage": 0.23, "elapsed_time": "0:02:30", "remaining_time": "18:14:23", "throughput": 3340.77, "total_tokens": 501984} +{"current_steps": 415, "total_steps": 179580, "loss": 1.1732, "lr": 1.152689609087872e-06, "epoch": 0.04621895534023834, "percentage": 0.23, "elapsed_time": "0:02:32", "remaining_time": "18:14:23", "throughput": 3340.84, "total_tokens": 508128} +{"current_steps": 420, "total_steps": 179580, "loss": 1.0212, "lr": 1.166610981178305e-06, "epoch": 0.046775810223855664, "percentage": 0.23, "elapsed_time": "0:02:33", "remaining_time": "18:14:09", "throughput": 3340.77, "total_tokens": 514144} +{"current_steps": 425, "total_steps": 179580, "loss": 1.0914, "lr": 1.1805323532687383e-06, "epoch": 0.04733266510747299, "percentage": 0.24, "elapsed_time": "0:02:35", "remaining_time": "18:14:06", "throughput": 3341.17, "total_tokens": 520320} +{"current_steps": 430, "total_steps": 179580, "loss": 1.092, "lr": 1.1944537253591713e-06, "epoch": 0.04788951999109032, "percentage": 0.24, "elapsed_time": "0:02:37", "remaining_time": "18:14:12", "throughput": 3341.75, "total_tokens": 526592} +{"current_steps": 435, "total_steps": 179580, "loss": 1.188, "lr": 1.2083750974496048e-06, "epoch": 0.048446374874707654, "percentage": 0.24, "elapsed_time": "0:02:39", "remaining_time": "18:14:57", "throughput": 3342.08, "total_tokens": 533152} +{"current_steps": 440, "total_steps": 179580, "loss": 1.0808, "lr": 1.2222964695400379e-06, "epoch": 0.04900322975832498, "percentage": 0.25, "elapsed_time": "0:02:41", "remaining_time": "18:14:43", "throughput": 3342.18, "total_tokens": 539200} +{"current_steps": 445, "total_steps": 179580, "loss": 0.9234, "lr": 1.2362178416304711e-06, "epoch": 0.04956008464194231, "percentage": 0.25, "elapsed_time": "0:02:43", "remaining_time": "18:14:29", "throughput": 3342.35, "total_tokens": 545248} +{"current_steps": 450, "total_steps": 179580, "loss": 1.1584, "lr": 1.2501392137209044e-06, "epoch": 0.05011693952555964, "percentage": 0.25, "elapsed_time": "0:02:44", "remaining_time": "18:12:20", "throughput": 3341.34, "total_tokens": 550144} +{"current_steps": 455, "total_steps": 179580, "loss": 1.1143, "lr": 1.2640605858113377e-06, "epoch": 0.05067379440917697, "percentage": 0.25, "elapsed_time": "0:02:46", "remaining_time": "18:12:35", "throughput": 3342.05, "total_tokens": 556512} +{"current_steps": 460, "total_steps": 179580, "loss": 1.2427, "lr": 1.277981957901771e-06, "epoch": 0.0512306492927943, "percentage": 0.26, "elapsed_time": "0:02:48", "remaining_time": "18:12:19", "throughput": 3342.15, "total_tokens": 562528} +{"current_steps": 465, "total_steps": 179580, "loss": 1.1332, "lr": 1.291903329992204e-06, "epoch": 0.051787504176411626, "percentage": 0.26, "elapsed_time": "0:02:50", "remaining_time": "18:13:01", "throughput": 3342.9, "total_tokens": 569152} +{"current_steps": 470, "total_steps": 179580, "loss": 1.1753, "lr": 1.3058247020826373e-06, "epoch": 0.052344359060028954, "percentage": 0.26, "elapsed_time": "0:02:52", "remaining_time": "18:12:47", "throughput": 3342.92, "total_tokens": 575168} +{"current_steps": 475, "total_steps": 179580, "loss": 1.085, "lr": 1.3197460741730707e-06, "epoch": 0.05290121394364629, "percentage": 0.26, "elapsed_time": "0:02:53", "remaining_time": "18:12:40", "throughput": 3343.36, "total_tokens": 581312} +{"current_steps": 480, "total_steps": 179580, "loss": 1.0464, "lr": 1.3336674462635038e-06, "epoch": 0.053458068827263616, "percentage": 0.27, "elapsed_time": "0:02:55", "remaining_time": "18:12:55", "throughput": 3343.55, "total_tokens": 587616} +{"current_steps": 485, "total_steps": 179580, "loss": 0.9421, "lr": 1.347588818353937e-06, "epoch": 0.054014923710880944, "percentage": 0.27, "elapsed_time": "0:02:57", "remaining_time": "18:12:42", "throughput": 3343.5, "total_tokens": 593632} +{"current_steps": 490, "total_steps": 179580, "loss": 0.9928, "lr": 1.3615101904443701e-06, "epoch": 0.05457177859449827, "percentage": 0.27, "elapsed_time": "0:02:59", "remaining_time": "18:11:53", "throughput": 3343.74, "total_tokens": 599360} +{"current_steps": 495, "total_steps": 179580, "loss": 1.0638, "lr": 1.3754315625348036e-06, "epoch": 0.055128633478115606, "percentage": 0.28, "elapsed_time": "0:03:01", "remaining_time": "18:11:53", "throughput": 3343.8, "total_tokens": 605504} +{"current_steps": 500, "total_steps": 179580, "loss": 1.1672, "lr": 1.3893529346252367e-06, "epoch": 0.055685488361732934, "percentage": 0.28, "elapsed_time": "0:03:02", "remaining_time": "18:11:45", "throughput": 3344.24, "total_tokens": 611648} +{"current_steps": 505, "total_steps": 179580, "loss": 1.2417, "lr": 1.40327430671567e-06, "epoch": 0.05624234324535026, "percentage": 0.28, "elapsed_time": "0:03:04", "remaining_time": "18:11:47", "throughput": 3344.58, "total_tokens": 617856} +{"current_steps": 510, "total_steps": 179580, "loss": 1.0426, "lr": 1.4171956788061032e-06, "epoch": 0.05679919812896759, "percentage": 0.28, "elapsed_time": "0:03:06", "remaining_time": "18:11:38", "throughput": 3344.92, "total_tokens": 623968} +{"current_steps": 515, "total_steps": 179580, "loss": 1.3244, "lr": 1.4311170508965365e-06, "epoch": 0.05735605301258492, "percentage": 0.29, "elapsed_time": "0:03:08", "remaining_time": "18:11:14", "throughput": 3345.0, "total_tokens": 629888} +{"current_steps": 520, "total_steps": 179580, "loss": 0.9795, "lr": 1.4450384229869697e-06, "epoch": 0.05791290789620225, "percentage": 0.29, "elapsed_time": "0:03:10", "remaining_time": "18:10:44", "throughput": 3345.4, "total_tokens": 635808} +{"current_steps": 525, "total_steps": 179580, "loss": 1.2212, "lr": 1.4589597950774028e-06, "epoch": 0.05846976277981958, "percentage": 0.29, "elapsed_time": "0:03:11", "remaining_time": "18:10:07", "throughput": 3344.36, "total_tokens": 641376} +{"current_steps": 530, "total_steps": 179580, "loss": 1.1411, "lr": 1.472881167167836e-06, "epoch": 0.059026617663436906, "percentage": 0.3, "elapsed_time": "0:03:13", "remaining_time": "18:09:56", "throughput": 3344.36, "total_tokens": 647392} +{"current_steps": 535, "total_steps": 179580, "loss": 1.2156, "lr": 1.4868025392582693e-06, "epoch": 0.05958347254705424, "percentage": 0.3, "elapsed_time": "0:03:15", "remaining_time": "18:10:05", "throughput": 3344.32, "total_tokens": 653600} +{"current_steps": 540, "total_steps": 179580, "loss": 1.2132, "lr": 1.5007239113487026e-06, "epoch": 0.06014032743067157, "percentage": 0.3, "elapsed_time": "0:03:17", "remaining_time": "18:10:43", "throughput": 3344.38, "total_tokens": 660128} +{"current_steps": 545, "total_steps": 179580, "loss": 1.1318, "lr": 1.5146452834391359e-06, "epoch": 0.060697182314288896, "percentage": 0.3, "elapsed_time": "0:03:19", "remaining_time": "18:10:15", "throughput": 3343.97, "total_tokens": 665888} +{"current_steps": 550, "total_steps": 179580, "loss": 1.0766, "lr": 1.528566655529569e-06, "epoch": 0.06125403719790622, "percentage": 0.31, "elapsed_time": "0:03:20", "remaining_time": "18:10:18", "throughput": 3344.35, "total_tokens": 672128} +{"current_steps": 555, "total_steps": 179580, "loss": 1.3743, "lr": 1.5424880276200024e-06, "epoch": 0.06181089208152356, "percentage": 0.31, "elapsed_time": "0:03:22", "remaining_time": "18:09:28", "throughput": 3344.18, "total_tokens": 677696} +{"current_steps": 560, "total_steps": 179580, "loss": 1.1487, "lr": 1.5564093997104355e-06, "epoch": 0.062367746965140886, "percentage": 0.31, "elapsed_time": "0:03:24", "remaining_time": "18:09:48", "throughput": 3344.31, "total_tokens": 684064} +{"current_steps": 565, "total_steps": 179580, "loss": 1.0237, "lr": 1.5703307718008687e-06, "epoch": 0.06292460184875821, "percentage": 0.31, "elapsed_time": "0:03:26", "remaining_time": "18:09:52", "throughput": 3344.5, "total_tokens": 690272} +{"current_steps": 570, "total_steps": 179580, "loss": 1.0703, "lr": 1.584252143891302e-06, "epoch": 0.06348145673237554, "percentage": 0.32, "elapsed_time": "0:03:28", "remaining_time": "18:09:11", "throughput": 3344.52, "total_tokens": 695968} +{"current_steps": 575, "total_steps": 179580, "loss": 1.239, "lr": 1.598173515981735e-06, "epoch": 0.06403831161599287, "percentage": 0.32, "elapsed_time": "0:03:29", "remaining_time": "18:09:30", "throughput": 3344.57, "total_tokens": 702304} +{"current_steps": 580, "total_steps": 179580, "loss": 0.9902, "lr": 1.6120948880721683e-06, "epoch": 0.0645951664996102, "percentage": 0.32, "elapsed_time": "0:03:31", "remaining_time": "18:09:38", "throughput": 3344.56, "total_tokens": 708512} +{"current_steps": 585, "total_steps": 179580, "loss": 1.2604, "lr": 1.6260162601626018e-06, "epoch": 0.06515202138322754, "percentage": 0.33, "elapsed_time": "0:03:33", "remaining_time": "18:09:51", "throughput": 3345.15, "total_tokens": 714912} +{"current_steps": 590, "total_steps": 179580, "loss": 1.3001, "lr": 1.639937632253035e-06, "epoch": 0.06570887626684487, "percentage": 0.33, "elapsed_time": "0:03:35", "remaining_time": "18:09:46", "throughput": 3345.35, "total_tokens": 721024} +{"current_steps": 595, "total_steps": 179580, "loss": 1.1155, "lr": 1.6538590043434682e-06, "epoch": 0.06626573115046219, "percentage": 0.33, "elapsed_time": "0:03:37", "remaining_time": "18:09:51", "throughput": 3345.12, "total_tokens": 727168} +{"current_steps": 600, "total_steps": 179580, "loss": 1.2763, "lr": 1.6677803764339014e-06, "epoch": 0.06682258603407952, "percentage": 0.33, "elapsed_time": "0:03:39", "remaining_time": "18:09:47", "throughput": 3344.66, "total_tokens": 733152} +{"current_steps": 605, "total_steps": 179580, "loss": 1.0431, "lr": 1.6817017485243347e-06, "epoch": 0.06737944091769685, "percentage": 0.34, "elapsed_time": "0:03:41", "remaining_time": "18:09:55", "throughput": 3344.48, "total_tokens": 739328} +{"current_steps": 610, "total_steps": 179580, "loss": 1.0579, "lr": 1.6956231206147678e-06, "epoch": 0.06793629580131418, "percentage": 0.34, "elapsed_time": "0:03:42", "remaining_time": "18:09:58", "throughput": 3344.82, "total_tokens": 745568} +{"current_steps": 615, "total_steps": 179580, "loss": 1.0363, "lr": 1.709544492705201e-06, "epoch": 0.0684931506849315, "percentage": 0.34, "elapsed_time": "0:03:44", "remaining_time": "18:10:04", "throughput": 3345.28, "total_tokens": 751872} +{"current_steps": 620, "total_steps": 179580, "loss": 1.2397, "lr": 1.7234658647956343e-06, "epoch": 0.06905000556854883, "percentage": 0.35, "elapsed_time": "0:03:46", "remaining_time": "18:09:43", "throughput": 3345.52, "total_tokens": 757824} +{"current_steps": 625, "total_steps": 179580, "loss": 1.0931, "lr": 1.7373872368860673e-06, "epoch": 0.06960686045216617, "percentage": 0.35, "elapsed_time": "0:03:48", "remaining_time": "18:10:04", "throughput": 3346.03, "total_tokens": 764320} +{"current_steps": 630, "total_steps": 179580, "loss": 1.2674, "lr": 1.751308608976501e-06, "epoch": 0.0701637153357835, "percentage": 0.35, "elapsed_time": "0:03:50", "remaining_time": "18:10:13", "throughput": 3346.19, "total_tokens": 770592} +{"current_steps": 635, "total_steps": 179580, "loss": 1.0855, "lr": 1.765229981066934e-06, "epoch": 0.07072057021940083, "percentage": 0.35, "elapsed_time": "0:03:51", "remaining_time": "18:09:11", "throughput": 3346.04, "total_tokens": 775968} +{"current_steps": 640, "total_steps": 179580, "loss": 1.1887, "lr": 1.7791513531573674e-06, "epoch": 0.07127742510301815, "percentage": 0.36, "elapsed_time": "0:03:53", "remaining_time": "18:09:14", "throughput": 3346.11, "total_tokens": 782144} +{"current_steps": 645, "total_steps": 179580, "loss": 1.089, "lr": 1.7930727252478004e-06, "epoch": 0.07183427998663548, "percentage": 0.36, "elapsed_time": "0:03:55", "remaining_time": "18:09:16", "throughput": 3346.32, "total_tokens": 788352} +{"current_steps": 650, "total_steps": 179580, "loss": 1.1123, "lr": 1.8069940973382337e-06, "epoch": 0.07239113487025281, "percentage": 0.36, "elapsed_time": "0:03:57", "remaining_time": "18:09:11", "throughput": 3346.47, "total_tokens": 794464} +{"current_steps": 655, "total_steps": 179580, "loss": 1.363, "lr": 1.820915469428667e-06, "epoch": 0.07294798975387014, "percentage": 0.36, "elapsed_time": "0:03:59", "remaining_time": "18:09:07", "throughput": 3346.74, "total_tokens": 800608} +{"current_steps": 660, "total_steps": 179580, "loss": 1.1472, "lr": 1.8348368415191e-06, "epoch": 0.07350484463748747, "percentage": 0.37, "elapsed_time": "0:04:00", "remaining_time": "18:08:42", "throughput": 3346.61, "total_tokens": 806400} +{"current_steps": 665, "total_steps": 179580, "loss": 1.1022, "lr": 1.8487582136095333e-06, "epoch": 0.0740616995211048, "percentage": 0.37, "elapsed_time": "0:04:02", "remaining_time": "18:08:42", "throughput": 3346.26, "total_tokens": 812448} +{"current_steps": 670, "total_steps": 179580, "loss": 1.2521, "lr": 1.8626795856999668e-06, "epoch": 0.07461855440472213, "percentage": 0.37, "elapsed_time": "0:04:04", "remaining_time": "18:07:59", "throughput": 3346.0, "total_tokens": 817984} +{"current_steps": 675, "total_steps": 179580, "loss": 1.0763, "lr": 1.8766009577904e-06, "epoch": 0.07517540928833946, "percentage": 0.38, "elapsed_time": "0:04:06", "remaining_time": "18:07:40", "throughput": 3345.65, "total_tokens": 823776} +{"current_steps": 680, "total_steps": 179580, "loss": 1.0381, "lr": 1.890522329880833e-06, "epoch": 0.07573226417195679, "percentage": 0.38, "elapsed_time": "0:04:08", "remaining_time": "18:07:46", "throughput": 3346.05, "total_tokens": 830080} +{"current_steps": 685, "total_steps": 179580, "loss": 0.9918, "lr": 1.9044437019712664e-06, "epoch": 0.07628911905557412, "percentage": 0.38, "elapsed_time": "0:04:09", "remaining_time": "18:07:53", "throughput": 3345.99, "total_tokens": 836288} +{"current_steps": 690, "total_steps": 179580, "loss": 1.2199, "lr": 1.9183650740616994e-06, "epoch": 0.07684597393919144, "percentage": 0.38, "elapsed_time": "0:04:11", "remaining_time": "18:07:56", "throughput": 3346.15, "total_tokens": 842496} +{"current_steps": 695, "total_steps": 179580, "loss": 0.9891, "lr": 1.932286446152133e-06, "epoch": 0.07740282882280877, "percentage": 0.39, "elapsed_time": "0:04:13", "remaining_time": "18:07:28", "throughput": 3346.17, "total_tokens": 848256} +{"current_steps": 700, "total_steps": 179580, "loss": 0.98, "lr": 1.946207818242566e-06, "epoch": 0.0779596837064261, "percentage": 0.39, "elapsed_time": "0:04:15", "remaining_time": "18:07:05", "throughput": 3346.02, "total_tokens": 854048} +{"current_steps": 705, "total_steps": 179580, "loss": 1.0428, "lr": 1.960129190332999e-06, "epoch": 0.07851653859004344, "percentage": 0.39, "elapsed_time": "0:04:17", "remaining_time": "18:06:58", "throughput": 3345.94, "total_tokens": 860064} +{"current_steps": 710, "total_steps": 179580, "loss": 1.1893, "lr": 1.9740505624234325e-06, "epoch": 0.07907339347366077, "percentage": 0.4, "elapsed_time": "0:04:18", "remaining_time": "18:07:04", "throughput": 3345.72, "total_tokens": 866208} +{"current_steps": 715, "total_steps": 179580, "loss": 1.3148, "lr": 1.987971934513866e-06, "epoch": 0.0796302483572781, "percentage": 0.4, "elapsed_time": "0:04:20", "remaining_time": "18:07:07", "throughput": 3345.91, "total_tokens": 872416} +{"current_steps": 720, "total_steps": 179580, "loss": 0.9405, "lr": 2.001893306604299e-06, "epoch": 0.08018710324089542, "percentage": 0.4, "elapsed_time": "0:04:22", "remaining_time": "18:07:15", "throughput": 3345.81, "total_tokens": 878624} +{"current_steps": 725, "total_steps": 179580, "loss": 1.244, "lr": 2.015814678694732e-06, "epoch": 0.08074395812451275, "percentage": 0.4, "elapsed_time": "0:04:24", "remaining_time": "18:07:22", "throughput": 3345.72, "total_tokens": 884832} +{"current_steps": 730, "total_steps": 179580, "loss": 1.161, "lr": 2.0297360507851656e-06, "epoch": 0.08130081300813008, "percentage": 0.41, "elapsed_time": "0:04:26", "remaining_time": "18:07:25", "throughput": 3345.77, "total_tokens": 891008} +{"current_steps": 735, "total_steps": 179580, "loss": 1.222, "lr": 2.0436574228755986e-06, "epoch": 0.08185766789174741, "percentage": 0.41, "elapsed_time": "0:04:28", "remaining_time": "18:07:14", "throughput": 3346.04, "total_tokens": 897056} +{"current_steps": 740, "total_steps": 179580, "loss": 1.3422, "lr": 2.0575787949660317e-06, "epoch": 0.08241452277536473, "percentage": 0.41, "elapsed_time": "0:04:29", "remaining_time": "18:06:27", "throughput": 3345.8, "total_tokens": 902464} +{"current_steps": 745, "total_steps": 179580, "loss": 1.1227, "lr": 2.071500167056465e-06, "epoch": 0.08297137765898208, "percentage": 0.41, "elapsed_time": "0:04:31", "remaining_time": "18:06:46", "throughput": 3345.96, "total_tokens": 908896} +{"current_steps": 750, "total_steps": 179580, "loss": 1.292, "lr": 2.0854215391468987e-06, "epoch": 0.0835282325425994, "percentage": 0.42, "elapsed_time": "0:04:33", "remaining_time": "18:06:37", "throughput": 3346.11, "total_tokens": 914944} +{"current_steps": 755, "total_steps": 179580, "loss": 1.3656, "lr": 2.0993429112373317e-06, "epoch": 0.08408508742621673, "percentage": 0.42, "elapsed_time": "0:04:35", "remaining_time": "18:06:43", "throughput": 3346.01, "total_tokens": 921120} +{"current_steps": 760, "total_steps": 179580, "loss": 1.0275, "lr": 2.1132642833277648e-06, "epoch": 0.08464194230983406, "percentage": 0.42, "elapsed_time": "0:04:37", "remaining_time": "18:06:37", "throughput": 3346.04, "total_tokens": 927168} +{"current_steps": 765, "total_steps": 179580, "loss": 1.0787, "lr": 2.1271856554181983e-06, "epoch": 0.08519879719345139, "percentage": 0.43, "elapsed_time": "0:04:38", "remaining_time": "18:06:30", "throughput": 3346.11, "total_tokens": 933216} +{"current_steps": 770, "total_steps": 179580, "loss": 1.1377, "lr": 2.1411070275086313e-06, "epoch": 0.08575565207706871, "percentage": 0.43, "elapsed_time": "0:04:40", "remaining_time": "18:06:16", "throughput": 3346.08, "total_tokens": 939136} +{"current_steps": 775, "total_steps": 179580, "loss": 0.8717, "lr": 2.1550283995990644e-06, "epoch": 0.08631250696068604, "percentage": 0.43, "elapsed_time": "0:04:42", "remaining_time": "18:06:10", "throughput": 3346.04, "total_tokens": 945152} +{"current_steps": 780, "total_steps": 179580, "loss": 1.0807, "lr": 2.168949771689498e-06, "epoch": 0.08686936184430337, "percentage": 0.43, "elapsed_time": "0:04:44", "remaining_time": "18:05:54", "throughput": 3346.15, "total_tokens": 951072} +{"current_steps": 785, "total_steps": 179580, "loss": 1.1092, "lr": 2.182871143779931e-06, "epoch": 0.0874262167279207, "percentage": 0.44, "elapsed_time": "0:04:45", "remaining_time": "18:05:39", "throughput": 3345.94, "total_tokens": 956928} +{"current_steps": 790, "total_steps": 179580, "loss": 1.2791, "lr": 2.1967925158703644e-06, "epoch": 0.08798307161153804, "percentage": 0.44, "elapsed_time": "0:04:47", "remaining_time": "18:05:52", "throughput": 3346.37, "total_tokens": 963360} +{"current_steps": 795, "total_steps": 179580, "loss": 1.0768, "lr": 2.2107138879607975e-06, "epoch": 0.08853992649515537, "percentage": 0.44, "elapsed_time": "0:04:49", "remaining_time": "18:06:06", "throughput": 3346.28, "total_tokens": 969664} +{"current_steps": 800, "total_steps": 179580, "loss": 1.409, "lr": 2.224635260051231e-06, "epoch": 0.0890967813787727, "percentage": 0.45, "elapsed_time": "0:04:51", "remaining_time": "18:06:16", "throughput": 3346.72, "total_tokens": 976064} +{"current_steps": 805, "total_steps": 179580, "loss": 1.0975, "lr": 2.238556632141664e-06, "epoch": 0.08965363626239002, "percentage": 0.45, "elapsed_time": "0:04:53", "remaining_time": "18:06:24", "throughput": 3346.77, "total_tokens": 982336} +{"current_steps": 810, "total_steps": 179580, "loss": 1.2597, "lr": 2.252478004232097e-06, "epoch": 0.09021049114600735, "percentage": 0.45, "elapsed_time": "0:04:55", "remaining_time": "18:05:40", "throughput": 3346.39, "total_tokens": 987680} +{"current_steps": 815, "total_steps": 179580, "loss": 1.2637, "lr": 2.2663993763225305e-06, "epoch": 0.09076734602962468, "percentage": 0.45, "elapsed_time": "0:04:57", "remaining_time": "18:05:57", "throughput": 3346.67, "total_tokens": 994144} +{"current_steps": 820, "total_steps": 179580, "loss": 1.1318, "lr": 2.2803207484129636e-06, "epoch": 0.091324200913242, "percentage": 0.46, "elapsed_time": "0:04:58", "remaining_time": "18:05:55", "throughput": 3346.48, "total_tokens": 1000192} +{"current_steps": 825, "total_steps": 179580, "loss": 1.2271, "lr": 2.2942421205033967e-06, "epoch": 0.09188105579685933, "percentage": 0.46, "elapsed_time": "0:05:00", "remaining_time": "18:05:55", "throughput": 3346.45, "total_tokens": 1006304} +{"current_steps": 830, "total_steps": 179580, "loss": 1.2139, "lr": 2.30816349259383e-06, "epoch": 0.09243791068047667, "percentage": 0.46, "elapsed_time": "0:05:02", "remaining_time": "18:06:02", "throughput": 3346.34, "total_tokens": 1012512} +{"current_steps": 835, "total_steps": 179580, "loss": 1.056, "lr": 2.3220848646842636e-06, "epoch": 0.092994765564094, "percentage": 0.46, "elapsed_time": "0:05:04", "remaining_time": "18:06:09", "throughput": 3346.24, "total_tokens": 1018720} +{"current_steps": 840, "total_steps": 179580, "loss": 1.1158, "lr": 2.3360062367746967e-06, "epoch": 0.09355162044771133, "percentage": 0.47, "elapsed_time": "0:05:06", "remaining_time": "18:05:35", "throughput": 3346.08, "total_tokens": 1024256} +{"current_steps": 845, "total_steps": 179580, "loss": 1.0849, "lr": 2.3499276088651297e-06, "epoch": 0.09410847533132866, "percentage": 0.47, "elapsed_time": "0:05:07", "remaining_time": "18:05:41", "throughput": 3346.03, "total_tokens": 1030464} +{"current_steps": 850, "total_steps": 179580, "loss": 1.1233, "lr": 2.3638489809555632e-06, "epoch": 0.09466533021494598, "percentage": 0.47, "elapsed_time": "0:05:09", "remaining_time": "18:05:27", "throughput": 3345.86, "total_tokens": 1036320} +{"current_steps": 855, "total_steps": 179580, "loss": 0.9331, "lr": 2.3777703530459963e-06, "epoch": 0.09522218509856331, "percentage": 0.48, "elapsed_time": "0:05:11", "remaining_time": "18:05:33", "throughput": 3345.91, "total_tokens": 1042560} +{"current_steps": 860, "total_steps": 179580, "loss": 1.3178, "lr": 2.3916917251364293e-06, "epoch": 0.09577903998218064, "percentage": 0.48, "elapsed_time": "0:05:13", "remaining_time": "18:05:40", "throughput": 3346.02, "total_tokens": 1048832} +{"current_steps": 865, "total_steps": 179580, "loss": 1.3257, "lr": 2.405613097226863e-06, "epoch": 0.09633589486579797, "percentage": 0.48, "elapsed_time": "0:05:15", "remaining_time": "18:05:41", "throughput": 3345.92, "total_tokens": 1054944} +{"current_steps": 870, "total_steps": 179580, "loss": 1.0747, "lr": 2.4195344693172963e-06, "epoch": 0.09689274974941531, "percentage": 0.48, "elapsed_time": "0:05:17", "remaining_time": "18:05:41", "throughput": 3345.88, "total_tokens": 1061056} +{"current_steps": 875, "total_steps": 179580, "loss": 0.8992, "lr": 2.4334558414077293e-06, "epoch": 0.09744960463303264, "percentage": 0.49, "elapsed_time": "0:05:18", "remaining_time": "18:05:24", "throughput": 3345.61, "total_tokens": 1066816} +{"current_steps": 880, "total_steps": 179580, "loss": 0.9768, "lr": 2.4473772134981624e-06, "epoch": 0.09800645951664996, "percentage": 0.49, "elapsed_time": "0:05:20", "remaining_time": "18:05:18", "throughput": 3345.26, "total_tokens": 1072736} +{"current_steps": 885, "total_steps": 179580, "loss": 1.1802, "lr": 2.461298585588596e-06, "epoch": 0.09856331440026729, "percentage": 0.49, "elapsed_time": "0:05:22", "remaining_time": "18:05:27", "throughput": 3345.47, "total_tokens": 1079072} +{"current_steps": 890, "total_steps": 179580, "loss": 1.3935, "lr": 2.475219957679029e-06, "epoch": 0.09912016928388462, "percentage": 0.5, "elapsed_time": "0:05:24", "remaining_time": "18:05:25", "throughput": 3345.79, "total_tokens": 1085280} +{"current_steps": 895, "total_steps": 179580, "loss": 1.0257, "lr": 2.489141329769462e-06, "epoch": 0.09967702416750195, "percentage": 0.5, "elapsed_time": "0:05:26", "remaining_time": "18:05:31", "throughput": 3345.72, "total_tokens": 1091488} +{"current_steps": 900, "total_steps": 179580, "loss": 1.3654, "lr": 2.5030627018598955e-06, "epoch": 0.10023387905111927, "percentage": 0.5, "elapsed_time": "0:05:27", "remaining_time": "18:04:59", "throughput": 3345.48, "total_tokens": 1096992} +{"current_steps": 905, "total_steps": 179580, "loss": 1.1658, "lr": 2.5169840739503285e-06, "epoch": 0.1007907339347366, "percentage": 0.5, "elapsed_time": "0:05:29", "remaining_time": "18:05:01", "throughput": 3345.54, "total_tokens": 1103168} +{"current_steps": 910, "total_steps": 179580, "loss": 1.2801, "lr": 2.530905446040762e-06, "epoch": 0.10134758881835394, "percentage": 0.51, "elapsed_time": "0:05:31", "remaining_time": "18:05:02", "throughput": 3345.61, "total_tokens": 1109344} +{"current_steps": 915, "total_steps": 179580, "loss": 1.1251, "lr": 2.544826818131195e-06, "epoch": 0.10190444370197127, "percentage": 0.51, "elapsed_time": "0:05:33", "remaining_time": "18:05:11", "throughput": 3345.83, "total_tokens": 1115680} +{"current_steps": 920, "total_steps": 179580, "loss": 1.0953, "lr": 2.5587481902216286e-06, "epoch": 0.1024612985855886, "percentage": 0.51, "elapsed_time": "0:05:35", "remaining_time": "18:05:10", "throughput": 3345.71, "total_tokens": 1121760} +{"current_steps": 925, "total_steps": 179580, "loss": 1.1253, "lr": 2.5726695623120616e-06, "epoch": 0.10301815346920593, "percentage": 0.52, "elapsed_time": "0:05:37", "remaining_time": "18:05:12", "throughput": 3345.77, "total_tokens": 1127936} +{"current_steps": 930, "total_steps": 179580, "loss": 1.0166, "lr": 2.5865909344024947e-06, "epoch": 0.10357500835282325, "percentage": 0.52, "elapsed_time": "0:05:39", "remaining_time": "18:05:23", "throughput": 3345.78, "total_tokens": 1134272} +{"current_steps": 935, "total_steps": 179580, "loss": 1.1149, "lr": 2.600512306492928e-06, "epoch": 0.10413186323644058, "percentage": 0.52, "elapsed_time": "0:05:40", "remaining_time": "18:04:55", "throughput": 3345.39, "total_tokens": 1139776} +{"current_steps": 940, "total_steps": 179580, "loss": 0.9964, "lr": 2.6144336785833612e-06, "epoch": 0.10468871812005791, "percentage": 0.52, "elapsed_time": "0:05:42", "remaining_time": "18:04:52", "throughput": 3345.23, "total_tokens": 1145792} +{"current_steps": 945, "total_steps": 179580, "loss": 1.0894, "lr": 2.6283550506737943e-06, "epoch": 0.10524557300367524, "percentage": 0.53, "elapsed_time": "0:05:44", "remaining_time": "18:04:55", "throughput": 3345.41, "total_tokens": 1152032} +{"current_steps": 950, "total_steps": 179580, "loss": 0.9707, "lr": 2.6422764227642278e-06, "epoch": 0.10580242788729258, "percentage": 0.53, "elapsed_time": "0:05:46", "remaining_time": "18:05:01", "throughput": 3345.52, "total_tokens": 1158304} +{"current_steps": 955, "total_steps": 179580, "loss": 1.0918, "lr": 2.6561977948546612e-06, "epoch": 0.1063592827709099, "percentage": 0.53, "elapsed_time": "0:05:48", "remaining_time": "18:04:55", "throughput": 3345.58, "total_tokens": 1164352} +{"current_steps": 960, "total_steps": 179580, "loss": 1.3314, "lr": 2.6701191669450943e-06, "epoch": 0.10691613765452723, "percentage": 0.53, "elapsed_time": "0:05:49", "remaining_time": "18:04:54", "throughput": 3345.98, "total_tokens": 1170592} +{"current_steps": 965, "total_steps": 179580, "loss": 0.9679, "lr": 2.6840405390355274e-06, "epoch": 0.10747299253814456, "percentage": 0.54, "elapsed_time": "0:05:51", "remaining_time": "18:05:07", "throughput": 3346.17, "total_tokens": 1177024} +{"current_steps": 970, "total_steps": 179580, "loss": 1.2934, "lr": 2.697961911125961e-06, "epoch": 0.10802984742176189, "percentage": 0.54, "elapsed_time": "0:05:53", "remaining_time": "18:05:09", "throughput": 3346.34, "total_tokens": 1183264} +{"current_steps": 975, "total_steps": 179580, "loss": 1.0349, "lr": 2.711883283216394e-06, "epoch": 0.10858670230537922, "percentage": 0.54, "elapsed_time": "0:05:55", "remaining_time": "18:05:08", "throughput": 3346.33, "total_tokens": 1189376} +{"current_steps": 980, "total_steps": 179580, "loss": 1.1246, "lr": 2.725804655306827e-06, "epoch": 0.10914355718899654, "percentage": 0.55, "elapsed_time": "0:05:57", "remaining_time": "18:05:21", "throughput": 3346.53, "total_tokens": 1195808} +{"current_steps": 985, "total_steps": 179580, "loss": 0.9264, "lr": 2.7397260273972604e-06, "epoch": 0.10970041207261387, "percentage": 0.55, "elapsed_time": "0:05:59", "remaining_time": "18:04:55", "throughput": 3346.18, "total_tokens": 1201344} +{"current_steps": 990, "total_steps": 179580, "loss": 1.0556, "lr": 2.753647399487694e-06, "epoch": 0.11025726695623121, "percentage": 0.55, "elapsed_time": "0:06:00", "remaining_time": "18:04:51", "throughput": 3346.17, "total_tokens": 1207392} +{"current_steps": 995, "total_steps": 179580, "loss": 0.9249, "lr": 2.767568771578127e-06, "epoch": 0.11081412183984854, "percentage": 0.55, "elapsed_time": "0:06:02", "remaining_time": "18:04:55", "throughput": 3346.22, "total_tokens": 1213632} +{"current_steps": 1000, "total_steps": 179580, "loss": 1.1363, "lr": 2.78149014366856e-06, "epoch": 0.11137097672346587, "percentage": 0.56, "elapsed_time": "0:06:04", "remaining_time": "18:04:52", "throughput": 3346.36, "total_tokens": 1219744} +{"current_steps": 1005, "total_steps": 179580, "loss": 1.0306, "lr": 2.7954115157589935e-06, "epoch": 0.1119278316070832, "percentage": 0.56, "elapsed_time": "0:06:06", "remaining_time": "18:05:05", "throughput": 3346.74, "total_tokens": 1226272} +{"current_steps": 1010, "total_steps": 179580, "loss": 1.2631, "lr": 2.8093328878494266e-06, "epoch": 0.11248468649070052, "percentage": 0.56, "elapsed_time": "0:06:08", "remaining_time": "18:04:32", "throughput": 3346.71, "total_tokens": 1231776} +{"current_steps": 1015, "total_steps": 179580, "loss": 1.3833, "lr": 2.8232542599398596e-06, "epoch": 0.11304154137431785, "percentage": 0.57, "elapsed_time": "0:06:09", "remaining_time": "18:04:20", "throughput": 3346.44, "total_tokens": 1237568} +{"current_steps": 1020, "total_steps": 179580, "loss": 1.0084, "lr": 2.837175632030293e-06, "epoch": 0.11359839625793518, "percentage": 0.57, "elapsed_time": "0:06:11", "remaining_time": "18:04:27", "throughput": 3346.56, "total_tokens": 1243872} +{"current_steps": 1025, "total_steps": 179580, "loss": 1.0141, "lr": 2.851097004120726e-06, "epoch": 0.1141552511415525, "percentage": 0.57, "elapsed_time": "0:06:13", "remaining_time": "18:04:41", "throughput": 3346.59, "total_tokens": 1250304} +{"current_steps": 1030, "total_steps": 179580, "loss": 1.121, "lr": 2.8650183762111596e-06, "epoch": 0.11471210602516985, "percentage": 0.57, "elapsed_time": "0:06:15", "remaining_time": "18:04:22", "throughput": 3346.61, "total_tokens": 1256064} +{"current_steps": 1035, "total_steps": 179580, "loss": 1.1759, "lr": 2.8789397483015927e-06, "epoch": 0.11526896090878717, "percentage": 0.58, "elapsed_time": "0:06:17", "remaining_time": "18:04:31", "throughput": 3346.78, "total_tokens": 1262432} +{"current_steps": 1040, "total_steps": 179580, "loss": 0.8641, "lr": 2.892861120392026e-06, "epoch": 0.1158258157924045, "percentage": 0.58, "elapsed_time": "0:06:19", "remaining_time": "18:04:32", "throughput": 3346.84, "total_tokens": 1268608} +{"current_steps": 1045, "total_steps": 179580, "loss": 0.9659, "lr": 2.9067824924824592e-06, "epoch": 0.11638267067602183, "percentage": 0.58, "elapsed_time": "0:06:20", "remaining_time": "18:04:25", "throughput": 3346.52, "total_tokens": 1274496} +{"current_steps": 1050, "total_steps": 179580, "loss": 0.9391, "lr": 2.9207038645728923e-06, "epoch": 0.11693952555963916, "percentage": 0.58, "elapsed_time": "0:06:22", "remaining_time": "18:03:57", "throughput": 3346.55, "total_tokens": 1280096} +{"current_steps": 1055, "total_steps": 179580, "loss": 1.1985, "lr": 2.9346252366633258e-06, "epoch": 0.11749638044325648, "percentage": 0.59, "elapsed_time": "0:06:24", "remaining_time": "18:04:02", "throughput": 3346.44, "total_tokens": 1286272} +{"current_steps": 1060, "total_steps": 179580, "loss": 1.0626, "lr": 2.948546608753759e-06, "epoch": 0.11805323532687381, "percentage": 0.59, "elapsed_time": "0:06:26", "remaining_time": "18:03:53", "throughput": 3346.53, "total_tokens": 1292256} +{"current_steps": 1065, "total_steps": 179580, "loss": 1.082, "lr": 2.962467980844192e-06, "epoch": 0.11861009021049114, "percentage": 0.59, "elapsed_time": "0:06:27", "remaining_time": "18:03:38", "throughput": 3346.39, "total_tokens": 1298048} +{"current_steps": 1070, "total_steps": 179580, "loss": 1.056, "lr": 2.9763893529346254e-06, "epoch": 0.11916694509410848, "percentage": 0.6, "elapsed_time": "0:06:29", "remaining_time": "18:03:40", "throughput": 3346.49, "total_tokens": 1304256} +{"current_steps": 1075, "total_steps": 179580, "loss": 1.0467, "lr": 2.990310725025059e-06, "epoch": 0.11972379997772581, "percentage": 0.6, "elapsed_time": "0:06:31", "remaining_time": "18:03:58", "throughput": 3346.76, "total_tokens": 1310848} +{"current_steps": 1080, "total_steps": 179580, "loss": 1.0704, "lr": 3.004232097115492e-06, "epoch": 0.12028065486134314, "percentage": 0.6, "elapsed_time": "0:06:33", "remaining_time": "18:03:29", "throughput": 3346.46, "total_tokens": 1316288} +{"current_steps": 1085, "total_steps": 179580, "loss": 1.0888, "lr": 3.018153469205925e-06, "epoch": 0.12083750974496046, "percentage": 0.6, "elapsed_time": "0:06:35", "remaining_time": "18:03:40", "throughput": 3346.51, "total_tokens": 1322656} +{"current_steps": 1090, "total_steps": 179580, "loss": 1.0922, "lr": 3.0320748412963585e-06, "epoch": 0.12139436462857779, "percentage": 0.61, "elapsed_time": "0:06:37", "remaining_time": "18:03:37", "throughput": 3346.48, "total_tokens": 1328704} +{"current_steps": 1095, "total_steps": 179580, "loss": 1.2838, "lr": 3.0459962133867915e-06, "epoch": 0.12195121951219512, "percentage": 0.61, "elapsed_time": "0:06:38", "remaining_time": "18:03:34", "throughput": 3346.58, "total_tokens": 1334816} +{"current_steps": 1100, "total_steps": 179580, "loss": 1.0887, "lr": 3.0599175854772246e-06, "epoch": 0.12250807439581245, "percentage": 0.61, "elapsed_time": "0:06:40", "remaining_time": "18:03:31", "throughput": 3346.66, "total_tokens": 1340928} +{"current_steps": 1105, "total_steps": 179580, "loss": 0.919, "lr": 3.073838957567658e-06, "epoch": 0.12306492927942977, "percentage": 0.62, "elapsed_time": "0:06:42", "remaining_time": "18:03:21", "throughput": 3346.64, "total_tokens": 1346848} +{"current_steps": 1110, "total_steps": 179580, "loss": 0.985, "lr": 3.0877603296580915e-06, "epoch": 0.12362178416304712, "percentage": 0.62, "elapsed_time": "0:06:44", "remaining_time": "18:03:24", "throughput": 3346.94, "total_tokens": 1353152} +{"current_steps": 1115, "total_steps": 179580, "loss": 1.0243, "lr": 3.1016817017485246e-06, "epoch": 0.12417863904666444, "percentage": 0.62, "elapsed_time": "0:06:46", "remaining_time": "18:03:29", "throughput": 3347.07, "total_tokens": 1359456} +{"current_steps": 1120, "total_steps": 179580, "loss": 1.2815, "lr": 3.1156030738389577e-06, "epoch": 0.12473549393028177, "percentage": 0.62, "elapsed_time": "0:06:47", "remaining_time": "18:03:21", "throughput": 3347.04, "total_tokens": 1365408} +{"current_steps": 1125, "total_steps": 179580, "loss": 1.0013, "lr": 3.129524445929391e-06, "epoch": 0.12529234881389908, "percentage": 0.63, "elapsed_time": "0:06:49", "remaining_time": "18:03:23", "throughput": 3347.26, "total_tokens": 1371680} +{"current_steps": 1130, "total_steps": 179580, "loss": 1.1276, "lr": 3.1434458180198246e-06, "epoch": 0.12584920369751643, "percentage": 0.63, "elapsed_time": "0:06:51", "remaining_time": "18:03:29", "throughput": 3347.47, "total_tokens": 1378016} +{"current_steps": 1135, "total_steps": 179580, "loss": 1.3121, "lr": 3.1573671901102573e-06, "epoch": 0.12640605858113377, "percentage": 0.63, "elapsed_time": "0:06:53", "remaining_time": "18:03:24", "throughput": 3347.56, "total_tokens": 1384096} +{"current_steps": 1140, "total_steps": 179580, "loss": 1.1884, "lr": 3.1712885622006907e-06, "epoch": 0.12696291346475108, "percentage": 0.63, "elapsed_time": "0:06:55", "remaining_time": "18:03:24", "throughput": 3347.51, "total_tokens": 1390208} +{"current_steps": 1145, "total_steps": 179580, "loss": 1.2022, "lr": 3.185209934291124e-06, "epoch": 0.12751976834836842, "percentage": 0.64, "elapsed_time": "0:06:57", "remaining_time": "18:03:24", "throughput": 3347.47, "total_tokens": 1396320} +{"current_steps": 1150, "total_steps": 179580, "loss": 1.3862, "lr": 3.1991313063815573e-06, "epoch": 0.12807662323198574, "percentage": 0.64, "elapsed_time": "0:06:59", "remaining_time": "18:03:32", "throughput": 3347.45, "total_tokens": 1402624} +{"current_steps": 1155, "total_steps": 179580, "loss": 1.1531, "lr": 3.2130526784719903e-06, "epoch": 0.12863347811560308, "percentage": 0.64, "elapsed_time": "0:07:00", "remaining_time": "18:03:37", "throughput": 3347.38, "total_tokens": 1408832} +{"current_steps": 1160, "total_steps": 179580, "loss": 1.0271, "lr": 3.226974050562424e-06, "epoch": 0.1291903329992204, "percentage": 0.65, "elapsed_time": "0:07:02", "remaining_time": "18:03:45", "throughput": 3347.4, "total_tokens": 1415168} +{"current_steps": 1165, "total_steps": 179580, "loss": 1.0536, "lr": 3.2408954226528564e-06, "epoch": 0.12974718788283773, "percentage": 0.65, "elapsed_time": "0:07:04", "remaining_time": "18:03:38", "throughput": 3347.16, "total_tokens": 1421056} +{"current_steps": 1170, "total_steps": 179580, "loss": 1.0806, "lr": 3.25481679474329e-06, "epoch": 0.13030404276645507, "percentage": 0.65, "elapsed_time": "0:07:06", "remaining_time": "18:03:07", "throughput": 3346.85, "total_tokens": 1426368} +{"current_steps": 1175, "total_steps": 179580, "loss": 1.1828, "lr": 3.2687381668337234e-06, "epoch": 0.1308608976500724, "percentage": 0.65, "elapsed_time": "0:07:07", "remaining_time": "18:02:58", "throughput": 3346.65, "total_tokens": 1432224} +{"current_steps": 1180, "total_steps": 179580, "loss": 1.1127, "lr": 3.2826595389241565e-06, "epoch": 0.13141775253368973, "percentage": 0.66, "elapsed_time": "0:07:09", "remaining_time": "18:03:01", "throughput": 3346.88, "total_tokens": 1438528} +{"current_steps": 1185, "total_steps": 179580, "loss": 1.0669, "lr": 3.29658091101459e-06, "epoch": 0.13197460741730704, "percentage": 0.66, "elapsed_time": "0:07:11", "remaining_time": "18:02:45", "throughput": 3346.84, "total_tokens": 1444288} +{"current_steps": 1190, "total_steps": 179580, "loss": 1.3338, "lr": 3.310502283105023e-06, "epoch": 0.13253146230092439, "percentage": 0.66, "elapsed_time": "0:07:13", "remaining_time": "18:02:52", "throughput": 3347.07, "total_tokens": 1450688} +{"current_steps": 1195, "total_steps": 179580, "loss": 1.174, "lr": 3.3244236551954565e-06, "epoch": 0.1330883171845417, "percentage": 0.67, "elapsed_time": "0:07:15", "remaining_time": "18:02:49", "throughput": 3347.05, "total_tokens": 1456736} +{"current_steps": 1200, "total_steps": 179580, "loss": 1.094, "lr": 3.338345027285889e-06, "epoch": 0.13364517206815904, "percentage": 0.67, "elapsed_time": "0:07:17", "remaining_time": "18:02:54", "throughput": 3347.04, "total_tokens": 1462976} +{"current_steps": 1205, "total_steps": 179580, "loss": 1.1936, "lr": 3.3522663993763226e-06, "epoch": 0.13420202695177635, "percentage": 0.67, "elapsed_time": "0:07:18", "remaining_time": "18:02:27", "throughput": 3347.06, "total_tokens": 1468512} +{"current_steps": 1210, "total_steps": 179580, "loss": 1.1879, "lr": 3.366187771466756e-06, "epoch": 0.1347588818353937, "percentage": 0.67, "elapsed_time": "0:07:20", "remaining_time": "18:02:27", "throughput": 3347.02, "total_tokens": 1474624} +{"current_steps": 1215, "total_steps": 179580, "loss": 1.0681, "lr": 3.380109143557189e-06, "epoch": 0.13531573671901104, "percentage": 0.68, "elapsed_time": "0:07:22", "remaining_time": "18:02:43", "throughput": 3347.11, "total_tokens": 1481184} +{"current_steps": 1220, "total_steps": 179580, "loss": 1.0111, "lr": 3.3940305156476226e-06, "epoch": 0.13587259160262835, "percentage": 0.68, "elapsed_time": "0:07:24", "remaining_time": "18:02:41", "throughput": 3347.26, "total_tokens": 1487328} +{"current_steps": 1225, "total_steps": 179580, "loss": 1.0403, "lr": 3.4079518877380557e-06, "epoch": 0.1364294464862457, "percentage": 0.68, "elapsed_time": "0:07:26", "remaining_time": "18:02:42", "throughput": 3347.41, "total_tokens": 1493568} +{"current_steps": 1230, "total_steps": 179580, "loss": 1.1796, "lr": 3.421873259828489e-06, "epoch": 0.136986301369863, "percentage": 0.68, "elapsed_time": "0:07:28", "remaining_time": "18:02:43", "throughput": 3347.47, "total_tokens": 1499744} +{"current_steps": 1235, "total_steps": 179580, "loss": 0.9163, "lr": 3.435794631918922e-06, "epoch": 0.13754315625348035, "percentage": 0.69, "elapsed_time": "0:07:29", "remaining_time": "18:02:49", "throughput": 3347.66, "total_tokens": 1506112} +{"current_steps": 1240, "total_steps": 179580, "loss": 0.9197, "lr": 3.4497160040093553e-06, "epoch": 0.13810001113709766, "percentage": 0.69, "elapsed_time": "0:07:31", "remaining_time": "18:02:52", "throughput": 3347.6, "total_tokens": 1512288} +{"current_steps": 1245, "total_steps": 179580, "loss": 1.0641, "lr": 3.4636373760997883e-06, "epoch": 0.138656866020715, "percentage": 0.69, "elapsed_time": "0:07:33", "remaining_time": "18:02:52", "throughput": 3347.66, "total_tokens": 1518464} +{"current_steps": 1250, "total_steps": 179580, "loss": 0.9883, "lr": 3.477558748190222e-06, "epoch": 0.13921372090433234, "percentage": 0.7, "elapsed_time": "0:07:35", "remaining_time": "18:02:45", "throughput": 3347.82, "total_tokens": 1524512} +{"current_steps": 1255, "total_steps": 179580, "loss": 0.9632, "lr": 3.4914801202806553e-06, "epoch": 0.13977057578794966, "percentage": 0.7, "elapsed_time": "0:07:37", "remaining_time": "18:02:51", "throughput": 3347.96, "total_tokens": 1530848} +{"current_steps": 1260, "total_steps": 179580, "loss": 0.762, "lr": 3.5054014923710884e-06, "epoch": 0.140327430671567, "percentage": 0.7, "elapsed_time": "0:07:39", "remaining_time": "18:02:52", "throughput": 3348.06, "total_tokens": 1537056} +{"current_steps": 1265, "total_steps": 179580, "loss": 1.1646, "lr": 3.519322864461522e-06, "epoch": 0.1408842855551843, "percentage": 0.7, "elapsed_time": "0:07:40", "remaining_time": "18:02:36", "throughput": 3348.18, "total_tokens": 1542880} +{"current_steps": 1270, "total_steps": 179580, "loss": 0.7351, "lr": 3.5332442365519545e-06, "epoch": 0.14144114043880165, "percentage": 0.71, "elapsed_time": "0:07:42", "remaining_time": "18:02:41", "throughput": 3348.35, "total_tokens": 1549216} +{"current_steps": 1275, "total_steps": 179580, "loss": 0.9456, "lr": 3.547165608642388e-06, "epoch": 0.14199799532241897, "percentage": 0.71, "elapsed_time": "0:07:44", "remaining_time": "18:02:37", "throughput": 3348.17, "total_tokens": 1555200} +{"current_steps": 1280, "total_steps": 179580, "loss": 0.7953, "lr": 3.561086980732821e-06, "epoch": 0.1425548502060363, "percentage": 0.71, "elapsed_time": "0:07:46", "remaining_time": "18:02:34", "throughput": 3348.14, "total_tokens": 1561248} +{"current_steps": 1285, "total_steps": 179580, "loss": 0.7831, "lr": 3.5750083528232545e-06, "epoch": 0.14311170508965362, "percentage": 0.72, "elapsed_time": "0:07:48", "remaining_time": "18:02:34", "throughput": 3348.09, "total_tokens": 1567360} +{"current_steps": 1290, "total_steps": 179580, "loss": 0.7957, "lr": 3.588929724913688e-06, "epoch": 0.14366855997327097, "percentage": 0.72, "elapsed_time": "0:07:49", "remaining_time": "18:02:34", "throughput": 3348.01, "total_tokens": 1573472} +{"current_steps": 1295, "total_steps": 179580, "loss": 0.9654, "lr": 3.602851097004121e-06, "epoch": 0.1442254148568883, "percentage": 0.72, "elapsed_time": "0:07:51", "remaining_time": "18:02:09", "throughput": 3348.15, "total_tokens": 1579072} +{"current_steps": 1300, "total_steps": 179580, "loss": 0.8836, "lr": 3.6167724690945545e-06, "epoch": 0.14478226974050562, "percentage": 0.72, "elapsed_time": "0:07:53", "remaining_time": "18:02:05", "throughput": 3348.1, "total_tokens": 1585088} +{"current_steps": 1305, "total_steps": 179580, "loss": 0.5754, "lr": 3.630693841184987e-06, "epoch": 0.14533912462412296, "percentage": 0.73, "elapsed_time": "0:07:55", "remaining_time": "18:02:02", "throughput": 3348.27, "total_tokens": 1591232} +{"current_steps": 1310, "total_steps": 179580, "loss": 0.9072, "lr": 3.6446152132754206e-06, "epoch": 0.14589597950774028, "percentage": 0.73, "elapsed_time": "0:07:56", "remaining_time": "18:01:36", "throughput": 3348.27, "total_tokens": 1596736} +{"current_steps": 1315, "total_steps": 179580, "loss": 0.9047, "lr": 3.6585365853658537e-06, "epoch": 0.14645283439135762, "percentage": 0.73, "elapsed_time": "0:07:58", "remaining_time": "18:01:47", "throughput": 3348.52, "total_tokens": 1603264} +{"current_steps": 1320, "total_steps": 179580, "loss": 0.6811, "lr": 3.672457957456287e-06, "epoch": 0.14700968927497493, "percentage": 0.74, "elapsed_time": "0:08:00", "remaining_time": "18:01:22", "throughput": 3348.19, "total_tokens": 1608640} +{"current_steps": 1325, "total_steps": 179580, "loss": 0.6591, "lr": 3.68637932954672e-06, "epoch": 0.14756654415859227, "percentage": 0.74, "elapsed_time": "0:08:02", "remaining_time": "18:00:57", "throughput": 3348.22, "total_tokens": 1614176} +{"current_steps": 1330, "total_steps": 179580, "loss": 0.7481, "lr": 3.7003007016371537e-06, "epoch": 0.1481233990422096, "percentage": 0.74, "elapsed_time": "0:08:03", "remaining_time": "18:00:59", "throughput": 3348.36, "total_tokens": 1620416} +{"current_steps": 1335, "total_steps": 179580, "loss": 0.7295, "lr": 3.714222073727587e-06, "epoch": 0.14868025392582693, "percentage": 0.74, "elapsed_time": "0:08:05", "remaining_time": "18:01:00", "throughput": 3348.43, "total_tokens": 1626624} +{"current_steps": 1340, "total_steps": 179580, "loss": 0.7115, "lr": 3.72814344581802e-06, "epoch": 0.14923710880944427, "percentage": 0.75, "elapsed_time": "0:08:07", "remaining_time": "18:01:08", "throughput": 3348.37, "total_tokens": 1632928} +{"current_steps": 1345, "total_steps": 179580, "loss": 0.6846, "lr": 3.7420648179084533e-06, "epoch": 0.14979396369306158, "percentage": 0.75, "elapsed_time": "0:08:09", "remaining_time": "18:01:05", "throughput": 3348.39, "total_tokens": 1639008} +{"current_steps": 1350, "total_steps": 179580, "loss": 0.3983, "lr": 3.7559861899988864e-06, "epoch": 0.15035081857667892, "percentage": 0.75, "elapsed_time": "0:08:11", "remaining_time": "18:00:59", "throughput": 3348.52, "total_tokens": 1645056} +{"current_steps": 1355, "total_steps": 179580, "loss": 0.4649, "lr": 3.76990756208932e-06, "epoch": 0.15090767346029624, "percentage": 0.75, "elapsed_time": "0:08:13", "remaining_time": "18:00:58", "throughput": 3348.46, "total_tokens": 1651136} +{"current_steps": 1360, "total_steps": 179580, "loss": 0.9049, "lr": 3.7838289341797525e-06, "epoch": 0.15146452834391358, "percentage": 0.76, "elapsed_time": "0:08:14", "remaining_time": "18:01:03", "throughput": 3348.54, "total_tokens": 1657440} +{"current_steps": 1365, "total_steps": 179580, "loss": 0.6586, "lr": 3.7977503062701864e-06, "epoch": 0.1520213832275309, "percentage": 0.76, "elapsed_time": "0:08:16", "remaining_time": "18:01:13", "throughput": 3348.84, "total_tokens": 1664000} +{"current_steps": 1370, "total_steps": 179580, "loss": 0.8186, "lr": 3.81167167836062e-06, "epoch": 0.15257823811114823, "percentage": 0.76, "elapsed_time": "0:08:18", "remaining_time": "18:00:59", "throughput": 3348.93, "total_tokens": 1669824} +{"current_steps": 1375, "total_steps": 179580, "loss": 0.4668, "lr": 3.825593050451053e-06, "epoch": 0.15313509299476558, "percentage": 0.77, "elapsed_time": "0:08:20", "remaining_time": "18:00:51", "throughput": 3348.92, "total_tokens": 1675744} +{"current_steps": 1380, "total_steps": 179580, "loss": 0.6046, "lr": 3.839514422541486e-06, "epoch": 0.1536919478783829, "percentage": 0.77, "elapsed_time": "0:08:22", "remaining_time": "18:00:48", "throughput": 3349.03, "total_tokens": 1681856} +{"current_steps": 1385, "total_steps": 179580, "loss": 0.7284, "lr": 3.853435794631919e-06, "epoch": 0.15424880276200023, "percentage": 0.77, "elapsed_time": "0:08:24", "remaining_time": "18:01:01", "throughput": 3349.23, "total_tokens": 1688448} +{"current_steps": 1390, "total_steps": 179580, "loss": 0.7467, "lr": 3.8673571667223525e-06, "epoch": 0.15480565764561754, "percentage": 0.77, "elapsed_time": "0:08:25", "remaining_time": "18:00:51", "throughput": 3349.19, "total_tokens": 1694304} +{"current_steps": 1395, "total_steps": 179580, "loss": 0.6433, "lr": 3.881278538812785e-06, "epoch": 0.1553625125292349, "percentage": 0.78, "elapsed_time": "0:08:27", "remaining_time": "18:00:51", "throughput": 3349.12, "total_tokens": 1700416} +{"current_steps": 1400, "total_steps": 179580, "loss": 0.4551, "lr": 3.895199910903219e-06, "epoch": 0.1559193674128522, "percentage": 0.78, "elapsed_time": "0:08:29", "remaining_time": "18:00:52", "throughput": 3349.2, "total_tokens": 1706624} +{"current_steps": 1405, "total_steps": 179580, "loss": 0.4186, "lr": 3.909121282993652e-06, "epoch": 0.15647622229646954, "percentage": 0.78, "elapsed_time": "0:08:31", "remaining_time": "18:00:52", "throughput": 3349.17, "total_tokens": 1712736} +{"current_steps": 1410, "total_steps": 179580, "loss": 0.503, "lr": 3.923042655084086e-06, "epoch": 0.15703307718008688, "percentage": 0.79, "elapsed_time": "0:08:33", "remaining_time": "18:00:57", "throughput": 3349.09, "total_tokens": 1718976} +{"current_steps": 1415, "total_steps": 179580, "loss": 0.611, "lr": 3.936964027174519e-06, "epoch": 0.1575899320637042, "percentage": 0.79, "elapsed_time": "0:08:34", "remaining_time": "18:00:43", "throughput": 3349.01, "total_tokens": 1724704} +{"current_steps": 1420, "total_steps": 179580, "loss": 0.5907, "lr": 3.950885399264952e-06, "epoch": 0.15814678694732154, "percentage": 0.79, "elapsed_time": "0:08:36", "remaining_time": "18:00:42", "throughput": 3348.85, "total_tokens": 1730752} +{"current_steps": 1425, "total_steps": 179580, "loss": 0.6027, "lr": 3.964806771355385e-06, "epoch": 0.15870364183093885, "percentage": 0.79, "elapsed_time": "0:08:38", "remaining_time": "18:00:39", "throughput": 3348.93, "total_tokens": 1736864} +{"current_steps": 1430, "total_steps": 179580, "loss": 0.7508, "lr": 3.978728143445818e-06, "epoch": 0.1592604967145562, "percentage": 0.8, "elapsed_time": "0:08:40", "remaining_time": "18:00:22", "throughput": 3348.86, "total_tokens": 1742496} +{"current_steps": 1435, "total_steps": 179580, "loss": 0.4867, "lr": 3.992649515536251e-06, "epoch": 0.1598173515981735, "percentage": 0.8, "elapsed_time": "0:08:42", "remaining_time": "18:00:17", "throughput": 3348.79, "total_tokens": 1748480} +{"current_steps": 1440, "total_steps": 179580, "loss": 0.4428, "lr": 4.006570887626685e-06, "epoch": 0.16037420648179085, "percentage": 0.8, "elapsed_time": "0:08:43", "remaining_time": "18:00:15", "throughput": 3348.73, "total_tokens": 1754528} +{"current_steps": 1445, "total_steps": 179580, "loss": 0.5508, "lr": 4.020492259717118e-06, "epoch": 0.16093106136540816, "percentage": 0.8, "elapsed_time": "0:08:45", "remaining_time": "18:00:20", "throughput": 3348.88, "total_tokens": 1760896} +{"current_steps": 1450, "total_steps": 179580, "loss": 0.4112, "lr": 4.034413631807551e-06, "epoch": 0.1614879162490255, "percentage": 0.81, "elapsed_time": "0:08:47", "remaining_time": "18:00:09", "throughput": 3348.77, "total_tokens": 1766656} +{"current_steps": 1455, "total_steps": 179580, "loss": 0.2568, "lr": 4.048335003897984e-06, "epoch": 0.16204477113264285, "percentage": 0.81, "elapsed_time": "0:08:49", "remaining_time": "18:00:02", "throughput": 3348.81, "total_tokens": 1772640} +{"current_steps": 1460, "total_steps": 179580, "loss": 0.5076, "lr": 4.062256375988418e-06, "epoch": 0.16260162601626016, "percentage": 0.81, "elapsed_time": "0:08:51", "remaining_time": "17:59:57", "throughput": 3348.66, "total_tokens": 1778560} +{"current_steps": 1465, "total_steps": 179580, "loss": 0.5197, "lr": 4.0761777480788505e-06, "epoch": 0.1631584808998775, "percentage": 0.82, "elapsed_time": "0:08:52", "remaining_time": "17:59:51", "throughput": 3348.79, "total_tokens": 1784608} +{"current_steps": 1470, "total_steps": 179580, "loss": 0.2842, "lr": 4.090099120169284e-06, "epoch": 0.16371533578349481, "percentage": 0.82, "elapsed_time": "0:08:54", "remaining_time": "17:59:47", "throughput": 3348.7, "total_tokens": 1790592} +{"current_steps": 1475, "total_steps": 179580, "loss": 0.3889, "lr": 4.1040204922597175e-06, "epoch": 0.16427219066711216, "percentage": 0.82, "elapsed_time": "0:08:56", "remaining_time": "17:59:43", "throughput": 3348.61, "total_tokens": 1796576} +{"current_steps": 1480, "total_steps": 179580, "loss": 0.5041, "lr": 4.117941864350151e-06, "epoch": 0.16482904555072947, "percentage": 0.82, "elapsed_time": "0:08:58", "remaining_time": "17:59:45", "throughput": 3348.47, "total_tokens": 1802688} +{"current_steps": 1485, "total_steps": 179580, "loss": 0.3398, "lr": 4.131863236440584e-06, "epoch": 0.1653859004343468, "percentage": 0.83, "elapsed_time": "0:09:00", "remaining_time": "17:59:53", "throughput": 3348.48, "total_tokens": 1809056} +{"current_steps": 1490, "total_steps": 179580, "loss": 0.5017, "lr": 4.145784608531017e-06, "epoch": 0.16594275531796415, "percentage": 0.83, "elapsed_time": "0:09:02", "remaining_time": "17:59:48", "throughput": 3348.42, "total_tokens": 1815040} +{"current_steps": 1495, "total_steps": 179580, "loss": 0.6191, "lr": 4.1597059806214505e-06, "epoch": 0.16649961020158147, "percentage": 0.83, "elapsed_time": "0:09:03", "remaining_time": "17:59:50", "throughput": 3348.32, "total_tokens": 1821184} +{"current_steps": 1500, "total_steps": 179580, "loss": 0.5421, "lr": 4.173627352711883e-06, "epoch": 0.1670564650851988, "percentage": 0.84, "elapsed_time": "0:09:05", "remaining_time": "17:59:50", "throughput": 3348.37, "total_tokens": 1827360} +{"current_steps": 1505, "total_steps": 179580, "loss": 0.6814, "lr": 4.187548724802317e-06, "epoch": 0.16761331996881612, "percentage": 0.84, "elapsed_time": "0:09:07", "remaining_time": "17:59:48", "throughput": 3348.45, "total_tokens": 1833472} +{"current_steps": 1510, "total_steps": 179580, "loss": 0.3186, "lr": 4.20147009689275e-06, "epoch": 0.16817017485243346, "percentage": 0.84, "elapsed_time": "0:09:09", "remaining_time": "17:59:36", "throughput": 3348.43, "total_tokens": 1839264} +{"current_steps": 1515, "total_steps": 179580, "loss": 0.4695, "lr": 4.215391468983184e-06, "epoch": 0.16872702973605078, "percentage": 0.84, "elapsed_time": "0:09:11", "remaining_time": "17:59:40", "throughput": 3348.55, "total_tokens": 1845600} +{"current_steps": 1520, "total_steps": 179580, "loss": 0.4132, "lr": 4.229312841073616e-06, "epoch": 0.16928388461966812, "percentage": 0.85, "elapsed_time": "0:09:13", "remaining_time": "17:59:55", "throughput": 3348.7, "total_tokens": 1852256} +{"current_steps": 1525, "total_steps": 179580, "loss": 0.4069, "lr": 4.24323421316405e-06, "epoch": 0.16984073950328543, "percentage": 0.85, "elapsed_time": "0:09:14", "remaining_time": "17:59:53", "throughput": 3348.8, "total_tokens": 1858400} +{"current_steps": 1530, "total_steps": 179580, "loss": 0.5903, "lr": 4.257155585254482e-06, "epoch": 0.17039759438690277, "percentage": 0.85, "elapsed_time": "0:09:16", "remaining_time": "17:59:34", "throughput": 3348.72, "total_tokens": 1863936} +{"current_steps": 1535, "total_steps": 179580, "loss": 0.2138, "lr": 4.271076957344916e-06, "epoch": 0.17095444927052011, "percentage": 0.85, "elapsed_time": "0:09:18", "remaining_time": "17:59:26", "throughput": 3348.61, "total_tokens": 1869792} +{"current_steps": 1540, "total_steps": 179580, "loss": 0.1948, "lr": 4.284998329435349e-06, "epoch": 0.17151130415413743, "percentage": 0.86, "elapsed_time": "0:09:20", "remaining_time": "17:59:23", "throughput": 3348.74, "total_tokens": 1875936} +{"current_steps": 1545, "total_steps": 179580, "loss": 0.3159, "lr": 4.298919701525783e-06, "epoch": 0.17206815903775477, "percentage": 0.86, "elapsed_time": "0:09:21", "remaining_time": "17:59:17", "throughput": 3348.81, "total_tokens": 1881920} +{"current_steps": 1550, "total_steps": 179580, "loss": 0.3217, "lr": 4.312841073616216e-06, "epoch": 0.17262501392137208, "percentage": 0.86, "elapsed_time": "0:09:23", "remaining_time": "17:59:20", "throughput": 3348.79, "total_tokens": 1888160} +{"current_steps": 1555, "total_steps": 179580, "loss": 0.2416, "lr": 4.326762445706649e-06, "epoch": 0.17318186880498943, "percentage": 0.87, "elapsed_time": "0:09:25", "remaining_time": "17:59:18", "throughput": 3348.74, "total_tokens": 1894208} +{"current_steps": 1560, "total_steps": 179580, "loss": 0.3791, "lr": 4.340683817797082e-06, "epoch": 0.17373872368860674, "percentage": 0.87, "elapsed_time": "0:09:27", "remaining_time": "17:59:21", "throughput": 3348.75, "total_tokens": 1900448} +{"current_steps": 1565, "total_steps": 179580, "loss": 0.6201, "lr": 4.354605189887515e-06, "epoch": 0.17429557857222408, "percentage": 0.87, "elapsed_time": "0:09:29", "remaining_time": "17:59:21", "throughput": 3348.79, "total_tokens": 1906624} +{"current_steps": 1570, "total_steps": 179580, "loss": 0.4133, "lr": 4.3685265619779485e-06, "epoch": 0.1748524334558414, "percentage": 0.87, "elapsed_time": "0:09:31", "remaining_time": "17:59:18", "throughput": 3348.81, "total_tokens": 1912672} +{"current_steps": 1575, "total_steps": 179580, "loss": 0.5123, "lr": 4.382447934068382e-06, "epoch": 0.17540928833945874, "percentage": 0.88, "elapsed_time": "0:09:33", "remaining_time": "17:59:20", "throughput": 3348.77, "total_tokens": 1918880} +{"current_steps": 1580, "total_steps": 179580, "loss": 0.3219, "lr": 4.3963693061588155e-06, "epoch": 0.17596614322307608, "percentage": 0.88, "elapsed_time": "0:09:34", "remaining_time": "17:59:23", "throughput": 3348.79, "total_tokens": 1925120} +{"current_steps": 1585, "total_steps": 179580, "loss": 0.3749, "lr": 4.410290678249249e-06, "epoch": 0.1765229981066934, "percentage": 0.88, "elapsed_time": "0:09:36", "remaining_time": "17:59:20", "throughput": 3348.59, "total_tokens": 1931040} +{"current_steps": 1590, "total_steps": 179580, "loss": 0.2577, "lr": 4.424212050339682e-06, "epoch": 0.17707985299031073, "percentage": 0.89, "elapsed_time": "0:09:38", "remaining_time": "17:59:21", "throughput": 3348.68, "total_tokens": 1937280} +{"current_steps": 1595, "total_steps": 179580, "loss": 0.6866, "lr": 4.438133422430115e-06, "epoch": 0.17763670787392805, "percentage": 0.89, "elapsed_time": "0:09:40", "remaining_time": "17:59:21", "throughput": 3348.68, "total_tokens": 1943424} +{"current_steps": 1600, "total_steps": 179580, "loss": 0.2686, "lr": 4.452054794520548e-06, "epoch": 0.1781935627575454, "percentage": 0.89, "elapsed_time": "0:09:42", "remaining_time": "17:59:21", "throughput": 3348.63, "total_tokens": 1949536} +{"current_steps": 1605, "total_steps": 179580, "loss": 0.3697, "lr": 4.465976166610981e-06, "epoch": 0.1787504176411627, "percentage": 0.89, "elapsed_time": "0:09:43", "remaining_time": "17:59:17", "throughput": 3348.57, "total_tokens": 1955520} +{"current_steps": 1610, "total_steps": 179580, "loss": 0.2921, "lr": 4.479897538701415e-06, "epoch": 0.17930727252478004, "percentage": 0.9, "elapsed_time": "0:09:45", "remaining_time": "17:58:58", "throughput": 3348.52, "total_tokens": 1961088} +{"current_steps": 1615, "total_steps": 179580, "loss": 0.2674, "lr": 4.493818910791848e-06, "epoch": 0.17986412740839738, "percentage": 0.9, "elapsed_time": "0:09:47", "remaining_time": "17:59:03", "throughput": 3348.42, "total_tokens": 1967328} +{"current_steps": 1620, "total_steps": 179580, "loss": 0.502, "lr": 4.507740282882282e-06, "epoch": 0.1804209822920147, "percentage": 0.9, "elapsed_time": "0:09:49", "remaining_time": "17:58:56", "throughput": 3348.35, "total_tokens": 1973216} +{"current_steps": 1625, "total_steps": 179580, "loss": 0.2848, "lr": 4.521661654972714e-06, "epoch": 0.18097783717563204, "percentage": 0.9, "elapsed_time": "0:09:51", "remaining_time": "17:58:42", "throughput": 3348.1, "total_tokens": 1978784} +{"current_steps": 1630, "total_steps": 179580, "loss": 0.4877, "lr": 4.535583027063148e-06, "epoch": 0.18153469205924935, "percentage": 0.91, "elapsed_time": "0:09:52", "remaining_time": "17:58:47", "throughput": 3348.13, "total_tokens": 1985088} +{"current_steps": 1635, "total_steps": 179580, "loss": 0.3934, "lr": 4.54950439915358e-06, "epoch": 0.1820915469428667, "percentage": 0.91, "elapsed_time": "0:09:54", "remaining_time": "17:58:47", "throughput": 3348.16, "total_tokens": 1991264} +{"current_steps": 1640, "total_steps": 179580, "loss": 0.4358, "lr": 4.563425771244014e-06, "epoch": 0.182648401826484, "percentage": 0.91, "elapsed_time": "0:09:56", "remaining_time": "17:58:41", "throughput": 3348.16, "total_tokens": 1997216} +{"current_steps": 1645, "total_steps": 179580, "loss": 0.2377, "lr": 4.577347143334447e-06, "epoch": 0.18320525671010135, "percentage": 0.92, "elapsed_time": "0:09:58", "remaining_time": "17:58:32", "throughput": 3347.87, "total_tokens": 2002912} +{"current_steps": 1650, "total_steps": 179580, "loss": 0.3776, "lr": 4.591268515424881e-06, "epoch": 0.18376211159371866, "percentage": 0.92, "elapsed_time": "0:10:00", "remaining_time": "17:58:37", "throughput": 3347.99, "total_tokens": 2009280} +{"current_steps": 1655, "total_steps": 179580, "loss": 0.336, "lr": 4.605189887515314e-06, "epoch": 0.184318966477336, "percentage": 0.92, "elapsed_time": "0:10:01", "remaining_time": "17:58:31", "throughput": 3348.09, "total_tokens": 2015296} +{"current_steps": 1660, "total_steps": 179580, "loss": 0.2888, "lr": 4.619111259605747e-06, "epoch": 0.18487582136095335, "percentage": 0.92, "elapsed_time": "0:10:03", "remaining_time": "17:58:35", "throughput": 3348.2, "total_tokens": 2021632} +{"current_steps": 1665, "total_steps": 179580, "loss": 0.3431, "lr": 4.6330326316961804e-06, "epoch": 0.18543267624457066, "percentage": 0.93, "elapsed_time": "0:10:05", "remaining_time": "17:58:35", "throughput": 3348.24, "total_tokens": 2027808} +{"current_steps": 1670, "total_steps": 179580, "loss": 0.3771, "lr": 4.646954003786613e-06, "epoch": 0.185989531128188, "percentage": 0.93, "elapsed_time": "0:10:07", "remaining_time": "17:58:37", "throughput": 3348.19, "total_tokens": 2033984} +{"current_steps": 1675, "total_steps": 179580, "loss": 0.3564, "lr": 4.6608753758770466e-06, "epoch": 0.18654638601180532, "percentage": 0.93, "elapsed_time": "0:10:09", "remaining_time": "17:58:27", "throughput": 3348.13, "total_tokens": 2039776} +{"current_steps": 1680, "total_steps": 179580, "loss": 0.4029, "lr": 4.67479674796748e-06, "epoch": 0.18710324089542266, "percentage": 0.94, "elapsed_time": "0:10:11", "remaining_time": "17:58:27", "throughput": 3348.09, "total_tokens": 2045888} +{"current_steps": 1685, "total_steps": 179580, "loss": 0.3496, "lr": 4.6887181200579135e-06, "epoch": 0.18766009577903997, "percentage": 0.94, "elapsed_time": "0:10:12", "remaining_time": "17:58:14", "throughput": 3347.94, "total_tokens": 2051552} +{"current_steps": 1690, "total_steps": 179580, "loss": 0.3618, "lr": 4.702639492148346e-06, "epoch": 0.1882169506626573, "percentage": 0.94, "elapsed_time": "0:10:14", "remaining_time": "17:58:12", "throughput": 3348.05, "total_tokens": 2057696} +{"current_steps": 1695, "total_steps": 179580, "loss": 0.5559, "lr": 4.71656086423878e-06, "epoch": 0.18877380554627465, "percentage": 0.94, "elapsed_time": "0:10:16", "remaining_time": "17:58:06", "throughput": 3348.06, "total_tokens": 2063648} +{"current_steps": 1700, "total_steps": 179580, "loss": 0.3409, "lr": 4.730482236329213e-06, "epoch": 0.18933066042989197, "percentage": 0.95, "elapsed_time": "0:10:18", "remaining_time": "17:58:07", "throughput": 3348.16, "total_tokens": 2069888} +{"current_steps": 1705, "total_steps": 179580, "loss": 0.3511, "lr": 4.744403608419646e-06, "epoch": 0.1898875153135093, "percentage": 0.95, "elapsed_time": "0:10:20", "remaining_time": "17:58:05", "throughput": 3348.24, "total_tokens": 2076032} +{"current_steps": 1710, "total_steps": 179580, "loss": 0.3835, "lr": 4.758324980510079e-06, "epoch": 0.19044437019712662, "percentage": 0.95, "elapsed_time": "0:10:21", "remaining_time": "17:57:52", "throughput": 3348.06, "total_tokens": 2081632} +{"current_steps": 1715, "total_steps": 179580, "loss": 0.22, "lr": 4.772246352600513e-06, "epoch": 0.19100122508074396, "percentage": 0.96, "elapsed_time": "0:10:23", "remaining_time": "17:57:49", "throughput": 3348.12, "total_tokens": 2087744} +{"current_steps": 1720, "total_steps": 179580, "loss": 0.3326, "lr": 4.786167724690946e-06, "epoch": 0.19155807996436128, "percentage": 0.96, "elapsed_time": "0:10:25", "remaining_time": "17:57:47", "throughput": 3348.14, "total_tokens": 2093824} +{"current_steps": 1725, "total_steps": 179580, "loss": 0.5653, "lr": 4.800089096781379e-06, "epoch": 0.19211493484797862, "percentage": 0.96, "elapsed_time": "0:10:27", "remaining_time": "17:57:47", "throughput": 3348.1, "total_tokens": 2099936} +{"current_steps": 1730, "total_steps": 179580, "loss": 0.5927, "lr": 4.814010468871812e-06, "epoch": 0.19267178973159593, "percentage": 0.96, "elapsed_time": "0:10:29", "remaining_time": "17:57:48", "throughput": 3347.98, "total_tokens": 2106048} +{"current_steps": 1735, "total_steps": 179580, "loss": 0.4022, "lr": 4.827931840962246e-06, "epoch": 0.19322864461521327, "percentage": 0.97, "elapsed_time": "0:10:30", "remaining_time": "17:57:45", "throughput": 3348.0, "total_tokens": 2112096} +{"current_steps": 1740, "total_steps": 179580, "loss": 0.248, "lr": 4.8418532130526784e-06, "epoch": 0.19378549949883062, "percentage": 0.97, "elapsed_time": "0:10:32", "remaining_time": "17:57:42", "throughput": 3347.94, "total_tokens": 2118112} +{"current_steps": 1745, "total_steps": 179580, "loss": 0.1881, "lr": 4.855774585143112e-06, "epoch": 0.19434235438244793, "percentage": 0.97, "elapsed_time": "0:10:34", "remaining_time": "17:57:48", "throughput": 3347.92, "total_tokens": 2124448} +{"current_steps": 1750, "total_steps": 179580, "loss": 0.2378, "lr": 4.869695957233545e-06, "epoch": 0.19489920926606527, "percentage": 0.97, "elapsed_time": "0:10:36", "remaining_time": "17:57:41", "throughput": 3347.76, "total_tokens": 2130272} +{"current_steps": 1755, "total_steps": 179580, "loss": 0.2634, "lr": 4.883617329323979e-06, "epoch": 0.19545606414968258, "percentage": 0.98, "elapsed_time": "0:10:38", "remaining_time": "17:57:42", "throughput": 3347.78, "total_tokens": 2136448} +{"current_steps": 1760, "total_steps": 179580, "loss": 0.2084, "lr": 4.8975387014144115e-06, "epoch": 0.19601291903329993, "percentage": 0.98, "elapsed_time": "0:10:39", "remaining_time": "17:57:36", "throughput": 3347.77, "total_tokens": 2142400} +{"current_steps": 1765, "total_steps": 179580, "loss": 0.2534, "lr": 4.911460073504845e-06, "epoch": 0.19656977391691724, "percentage": 0.98, "elapsed_time": "0:10:41", "remaining_time": "17:57:43", "throughput": 3347.91, "total_tokens": 2148864} +{"current_steps": 1770, "total_steps": 179580, "loss": 0.2862, "lr": 4.925381445595278e-06, "epoch": 0.19712662880053458, "percentage": 0.99, "elapsed_time": "0:10:43", "remaining_time": "17:57:40", "throughput": 3347.97, "total_tokens": 2154944} +{"current_steps": 1775, "total_steps": 179580, "loss": 0.4655, "lr": 4.939302817685711e-06, "epoch": 0.19768348368415192, "percentage": 0.99, "elapsed_time": "0:10:45", "remaining_time": "17:57:37", "throughput": 3348.0, "total_tokens": 2161024} +{"current_steps": 1780, "total_steps": 179580, "loss": 0.3978, "lr": 4.953224189776145e-06, "epoch": 0.19824033856776924, "percentage": 0.99, "elapsed_time": "0:10:47", "remaining_time": "17:57:38", "throughput": 3348.13, "total_tokens": 2167296} +{"current_steps": 1785, "total_steps": 179580, "loss": 0.5431, "lr": 4.967145561866578e-06, "epoch": 0.19879719345138658, "percentage": 0.99, "elapsed_time": "0:10:49", "remaining_time": "17:57:42", "throughput": 3348.27, "total_tokens": 2173664} +{"current_steps": 1790, "total_steps": 179580, "loss": 0.3384, "lr": 4.9810669339570116e-06, "epoch": 0.1993540483350039, "percentage": 1.0, "elapsed_time": "0:10:50", "remaining_time": "17:57:38", "throughput": 3348.15, "total_tokens": 2179616} +{"current_steps": 1795, "total_steps": 179580, "loss": 0.4324, "lr": 4.994988306047444e-06, "epoch": 0.19991090321862123, "percentage": 1.0, "elapsed_time": "0:10:52", "remaining_time": "17:57:35", "throughput": 3348.14, "total_tokens": 2185632} +{"current_steps": 1800, "total_steps": 179580, "loss": 0.401, "lr": 5.008909678137878e-06, "epoch": 0.20046775810223855, "percentage": 1.0, "elapsed_time": "0:10:54", "remaining_time": "17:57:30", "throughput": 3348.02, "total_tokens": 2191552} +{"current_steps": 1805, "total_steps": 179580, "loss": 0.2739, "lr": 5.02283105022831e-06, "epoch": 0.2010246129858559, "percentage": 1.01, "elapsed_time": "0:10:56", "remaining_time": "17:57:19", "throughput": 3347.94, "total_tokens": 2197280} +{"current_steps": 1810, "total_steps": 179580, "loss": 0.3497, "lr": 5.036752422318744e-06, "epoch": 0.2015814678694732, "percentage": 1.01, "elapsed_time": "0:10:58", "remaining_time": "17:57:26", "throughput": 3348.05, "total_tokens": 2203712} +{"current_steps": 1815, "total_steps": 179580, "loss": 0.2038, "lr": 5.050673794409177e-06, "epoch": 0.20213832275309054, "percentage": 1.01, "elapsed_time": "0:11:00", "remaining_time": "17:57:26", "throughput": 3348.11, "total_tokens": 2209920} +{"current_steps": 1820, "total_steps": 179580, "loss": 0.3487, "lr": 5.064595166499611e-06, "epoch": 0.20269517763670789, "percentage": 1.01, "elapsed_time": "0:11:01", "remaining_time": "17:57:22", "throughput": 3347.92, "total_tokens": 2215808} +{"current_steps": 1825, "total_steps": 179580, "loss": 0.3292, "lr": 5.078516538590044e-06, "epoch": 0.2032520325203252, "percentage": 1.02, "elapsed_time": "0:11:03", "remaining_time": "17:57:29", "throughput": 3348.02, "total_tokens": 2222240} +{"current_steps": 1830, "total_steps": 179580, "loss": 0.1464, "lr": 5.092437910680477e-06, "epoch": 0.20380888740394254, "percentage": 1.02, "elapsed_time": "0:11:05", "remaining_time": "17:57:25", "throughput": 3347.91, "total_tokens": 2228192} +{"current_steps": 1835, "total_steps": 179580, "loss": 0.5794, "lr": 5.10635928277091e-06, "epoch": 0.20436574228755985, "percentage": 1.02, "elapsed_time": "0:11:07", "remaining_time": "17:57:21", "throughput": 3347.77, "total_tokens": 2234112} +{"current_steps": 1840, "total_steps": 179580, "loss": 0.324, "lr": 5.120280654861343e-06, "epoch": 0.2049225971711772, "percentage": 1.02, "elapsed_time": "0:11:09", "remaining_time": "17:57:19", "throughput": 3347.9, "total_tokens": 2240288} +{"current_steps": 1845, "total_steps": 179580, "loss": 0.3048, "lr": 5.1342020269517765e-06, "epoch": 0.2054794520547945, "percentage": 1.03, "elapsed_time": "0:11:10", "remaining_time": "17:57:16", "throughput": 3347.9, "total_tokens": 2246336} +{"current_steps": 1850, "total_steps": 179580, "loss": 0.2549, "lr": 5.14812339904221e-06, "epoch": 0.20603630693841185, "percentage": 1.03, "elapsed_time": "0:11:12", "remaining_time": "17:57:22", "throughput": 3347.94, "total_tokens": 2252704} +{"current_steps": 1855, "total_steps": 179580, "loss": 0.3557, "lr": 5.162044771132643e-06, "epoch": 0.2065931618220292, "percentage": 1.03, "elapsed_time": "0:11:14", "remaining_time": "17:57:24", "throughput": 3347.96, "total_tokens": 2258944} +{"current_steps": 1860, "total_steps": 179580, "loss": 0.4276, "lr": 5.175966143223077e-06, "epoch": 0.2071500167056465, "percentage": 1.04, "elapsed_time": "0:11:16", "remaining_time": "17:57:01", "throughput": 3347.83, "total_tokens": 2264224} +{"current_steps": 1865, "total_steps": 179580, "loss": 0.148, "lr": 5.1898875153135095e-06, "epoch": 0.20770687158926385, "percentage": 1.04, "elapsed_time": "0:11:18", "remaining_time": "17:57:02", "throughput": 3347.93, "total_tokens": 2270464} +{"current_steps": 1870, "total_steps": 179580, "loss": 0.5185, "lr": 5.203808887403943e-06, "epoch": 0.20826372647288116, "percentage": 1.04, "elapsed_time": "0:11:19", "remaining_time": "17:56:58", "throughput": 3347.77, "total_tokens": 2276352} +{"current_steps": 1875, "total_steps": 179580, "loss": 0.3756, "lr": 5.217730259494376e-06, "epoch": 0.2088205813564985, "percentage": 1.04, "elapsed_time": "0:11:21", "remaining_time": "17:56:51", "throughput": 3347.8, "total_tokens": 2282272} +{"current_steps": 1880, "total_steps": 179580, "loss": 0.4594, "lr": 5.231651631584809e-06, "epoch": 0.20937743624011582, "percentage": 1.05, "elapsed_time": "0:11:23", "remaining_time": "17:56:53", "throughput": 3347.89, "total_tokens": 2288576} +{"current_steps": 1885, "total_steps": 179580, "loss": 0.6639, "lr": 5.245573003675243e-06, "epoch": 0.20993429112373316, "percentage": 1.05, "elapsed_time": "0:11:25", "remaining_time": "17:56:49", "throughput": 3347.8, "total_tokens": 2294528} +{"current_steps": 1890, "total_steps": 179580, "loss": 0.4249, "lr": 5.259494375765676e-06, "epoch": 0.21049114600735047, "percentage": 1.05, "elapsed_time": "0:11:27", "remaining_time": "17:56:53", "throughput": 3347.9, "total_tokens": 2300864} +{"current_steps": 1895, "total_steps": 179580, "loss": 0.3734, "lr": 5.27341574785611e-06, "epoch": 0.2110480008909678, "percentage": 1.06, "elapsed_time": "0:11:29", "remaining_time": "17:56:55", "throughput": 3347.88, "total_tokens": 2307072} +{"current_steps": 1900, "total_steps": 179580, "loss": 0.2148, "lr": 5.287337119946542e-06, "epoch": 0.21160485577458515, "percentage": 1.06, "elapsed_time": "0:11:30", "remaining_time": "17:56:49", "throughput": 3347.88, "total_tokens": 2313024} +{"current_steps": 1905, "total_steps": 179580, "loss": 0.2993, "lr": 5.301258492036976e-06, "epoch": 0.21216171065820247, "percentage": 1.06, "elapsed_time": "0:11:32", "remaining_time": "17:56:50", "throughput": 3347.83, "total_tokens": 2319200} +{"current_steps": 1910, "total_steps": 179580, "loss": 0.281, "lr": 5.315179864127408e-06, "epoch": 0.2127185655418198, "percentage": 1.06, "elapsed_time": "0:11:34", "remaining_time": "17:56:50", "throughput": 3347.79, "total_tokens": 2325312} +{"current_steps": 1915, "total_steps": 179580, "loss": 0.401, "lr": 5.329101236217842e-06, "epoch": 0.21327542042543712, "percentage": 1.07, "elapsed_time": "0:11:36", "remaining_time": "17:56:32", "throughput": 3347.77, "total_tokens": 2330784} +{"current_steps": 1920, "total_steps": 179580, "loss": 0.496, "lr": 5.343022608308275e-06, "epoch": 0.21383227530905446, "percentage": 1.07, "elapsed_time": "0:11:38", "remaining_time": "17:56:33", "throughput": 3347.76, "total_tokens": 2336992} +{"current_steps": 1925, "total_steps": 179580, "loss": 0.3068, "lr": 5.356943980398709e-06, "epoch": 0.21438913019267178, "percentage": 1.07, "elapsed_time": "0:11:39", "remaining_time": "17:56:38", "throughput": 3347.8, "total_tokens": 2343360} +{"current_steps": 1930, "total_steps": 179580, "loss": 0.4074, "lr": 5.370865352489141e-06, "epoch": 0.21494598507628912, "percentage": 1.07, "elapsed_time": "0:11:41", "remaining_time": "17:56:43", "throughput": 3347.85, "total_tokens": 2349728} +{"current_steps": 1935, "total_steps": 179580, "loss": 0.3294, "lr": 5.384786724579575e-06, "epoch": 0.21550283995990646, "percentage": 1.08, "elapsed_time": "0:11:43", "remaining_time": "17:56:40", "throughput": 3347.77, "total_tokens": 2355680} +{"current_steps": 1940, "total_steps": 179580, "loss": 0.4343, "lr": 5.398708096670008e-06, "epoch": 0.21605969484352378, "percentage": 1.08, "elapsed_time": "0:11:45", "remaining_time": "17:56:35", "throughput": 3347.61, "total_tokens": 2361568} +{"current_steps": 1945, "total_steps": 179580, "loss": 0.3027, "lr": 5.412629468760441e-06, "epoch": 0.21661654972714112, "percentage": 1.08, "elapsed_time": "0:11:47", "remaining_time": "17:56:39", "throughput": 3347.69, "total_tokens": 2367904} +{"current_steps": 1950, "total_steps": 179580, "loss": 0.2703, "lr": 5.4265508408508745e-06, "epoch": 0.21717340461075843, "percentage": 1.09, "elapsed_time": "0:11:49", "remaining_time": "17:56:48", "throughput": 3347.86, "total_tokens": 2374496} +{"current_steps": 1955, "total_steps": 179580, "loss": 0.3407, "lr": 5.440472212941308e-06, "epoch": 0.21773025949437577, "percentage": 1.09, "elapsed_time": "0:11:51", "remaining_time": "17:56:42", "throughput": 3347.83, "total_tokens": 2380416} +{"current_steps": 1960, "total_steps": 179580, "loss": 0.2759, "lr": 5.4543935850317414e-06, "epoch": 0.21828711437799309, "percentage": 1.09, "elapsed_time": "0:11:52", "remaining_time": "17:56:29", "throughput": 3347.79, "total_tokens": 2386080} +{"current_steps": 1965, "total_steps": 179580, "loss": 0.2211, "lr": 5.468314957122174e-06, "epoch": 0.21884396926161043, "percentage": 1.09, "elapsed_time": "0:11:54", "remaining_time": "17:56:33", "throughput": 3347.73, "total_tokens": 2392352} +{"current_steps": 1970, "total_steps": 179580, "loss": 0.3332, "lr": 5.4822363292126076e-06, "epoch": 0.21940082414522774, "percentage": 1.1, "elapsed_time": "0:11:56", "remaining_time": "17:56:35", "throughput": 3347.68, "total_tokens": 2398528} +{"current_steps": 1975, "total_steps": 179580, "loss": 0.1552, "lr": 5.496157701303041e-06, "epoch": 0.21995767902884508, "percentage": 1.1, "elapsed_time": "0:11:58", "remaining_time": "17:56:33", "throughput": 3347.75, "total_tokens": 2404672} +{"current_steps": 1980, "total_steps": 179580, "loss": 0.4573, "lr": 5.510079073393474e-06, "epoch": 0.22051453391246242, "percentage": 1.1, "elapsed_time": "0:12:00", "remaining_time": "17:56:33", "throughput": 3347.82, "total_tokens": 2410880} +{"current_steps": 1985, "total_steps": 179580, "loss": 0.3347, "lr": 5.524000445483907e-06, "epoch": 0.22107138879607974, "percentage": 1.11, "elapsed_time": "0:12:01", "remaining_time": "17:56:28", "throughput": 3347.85, "total_tokens": 2416864} +{"current_steps": 1990, "total_steps": 179580, "loss": 0.2228, "lr": 5.537921817574341e-06, "epoch": 0.22162824367969708, "percentage": 1.11, "elapsed_time": "0:12:03", "remaining_time": "17:56:22", "throughput": 3347.83, "total_tokens": 2422784} +{"current_steps": 1995, "total_steps": 179580, "loss": 0.2129, "lr": 5.551843189664774e-06, "epoch": 0.2221850985633144, "percentage": 1.11, "elapsed_time": "0:12:05", "remaining_time": "17:56:13", "throughput": 3347.78, "total_tokens": 2428576} +{"current_steps": 2000, "total_steps": 179580, "loss": 0.1566, "lr": 5.565764561755207e-06, "epoch": 0.22274195344693173, "percentage": 1.11, "elapsed_time": "0:12:07", "remaining_time": "17:56:11", "throughput": 3347.78, "total_tokens": 2434624} +{"current_steps": 2005, "total_steps": 179580, "loss": 0.4309, "lr": 5.57968593384564e-06, "epoch": 0.22329880833054905, "percentage": 1.12, "elapsed_time": "0:12:09", "remaining_time": "17:56:10", "throughput": 3347.78, "total_tokens": 2440768} +{"current_steps": 2010, "total_steps": 179580, "loss": 0.2892, "lr": 5.593607305936073e-06, "epoch": 0.2238556632141664, "percentage": 1.12, "elapsed_time": "0:12:10", "remaining_time": "17:56:06", "throughput": 3347.71, "total_tokens": 2446720} +{"current_steps": 2015, "total_steps": 179580, "loss": 0.3683, "lr": 5.607528678026506e-06, "epoch": 0.22441251809778373, "percentage": 1.12, "elapsed_time": "0:12:12", "remaining_time": "17:55:54", "throughput": 3347.66, "total_tokens": 2452352} +{"current_steps": 2020, "total_steps": 179580, "loss": 0.4704, "lr": 5.62145005011694e-06, "epoch": 0.22496937298140104, "percentage": 1.12, "elapsed_time": "0:12:14", "remaining_time": "17:55:56", "throughput": 3347.66, "total_tokens": 2458592} +{"current_steps": 2025, "total_steps": 179580, "loss": 0.4043, "lr": 5.635371422207373e-06, "epoch": 0.22552622786501839, "percentage": 1.13, "elapsed_time": "0:12:16", "remaining_time": "17:55:55", "throughput": 3347.84, "total_tokens": 2464832} +{"current_steps": 2030, "total_steps": 179580, "loss": 0.2002, "lr": 5.649292794297807e-06, "epoch": 0.2260830827486357, "percentage": 1.13, "elapsed_time": "0:12:18", "remaining_time": "17:56:03", "throughput": 3347.93, "total_tokens": 2471360} +{"current_steps": 2035, "total_steps": 179580, "loss": 0.3377, "lr": 5.6632141663882394e-06, "epoch": 0.22663993763225304, "percentage": 1.13, "elapsed_time": "0:12:19", "remaining_time": "17:56:00", "throughput": 3347.97, "total_tokens": 2477440} +{"current_steps": 2040, "total_steps": 179580, "loss": 0.2518, "lr": 5.677135538478673e-06, "epoch": 0.22719679251587035, "percentage": 1.14, "elapsed_time": "0:12:21", "remaining_time": "17:56:01", "throughput": 3347.92, "total_tokens": 2483616} +{"current_steps": 2045, "total_steps": 179580, "loss": 0.1658, "lr": 5.6910569105691056e-06, "epoch": 0.2277536473994877, "percentage": 1.14, "elapsed_time": "0:12:23", "remaining_time": "17:55:58", "throughput": 3347.9, "total_tokens": 2489632} +{"current_steps": 2050, "total_steps": 179580, "loss": 0.3498, "lr": 5.704978282659539e-06, "epoch": 0.228310502283105, "percentage": 1.14, "elapsed_time": "0:12:25", "remaining_time": "17:55:44", "throughput": 3347.89, "total_tokens": 2495232} +{"current_steps": 2055, "total_steps": 179580, "loss": 0.1879, "lr": 5.7188996547499725e-06, "epoch": 0.22886735716672235, "percentage": 1.14, "elapsed_time": "0:12:27", "remaining_time": "17:55:45", "throughput": 3348.05, "total_tokens": 2501568} +{"current_steps": 2060, "total_steps": 179580, "loss": 0.2731, "lr": 5.732821026840406e-06, "epoch": 0.2294242120503397, "percentage": 1.15, "elapsed_time": "0:12:28", "remaining_time": "17:55:29", "throughput": 3347.89, "total_tokens": 2506976} +{"current_steps": 2065, "total_steps": 179580, "loss": 0.2028, "lr": 5.7467423989308395e-06, "epoch": 0.229981066933957, "percentage": 1.15, "elapsed_time": "0:12:30", "remaining_time": "17:55:21", "throughput": 3347.92, "total_tokens": 2512832} +{"current_steps": 2070, "total_steps": 179580, "loss": 0.2895, "lr": 5.760663771021272e-06, "epoch": 0.23053792181757435, "percentage": 1.15, "elapsed_time": "0:12:32", "remaining_time": "17:55:26", "throughput": 3347.96, "total_tokens": 2519200} +{"current_steps": 2075, "total_steps": 179580, "loss": 0.2187, "lr": 5.774585143111706e-06, "epoch": 0.23109477670119166, "percentage": 1.16, "elapsed_time": "0:12:34", "remaining_time": "17:55:25", "throughput": 3347.96, "total_tokens": 2525344} +{"current_steps": 2080, "total_steps": 179580, "loss": 0.2337, "lr": 5.788506515202138e-06, "epoch": 0.231651631584809, "percentage": 1.16, "elapsed_time": "0:12:36", "remaining_time": "17:55:31", "throughput": 3348.01, "total_tokens": 2531744} +{"current_steps": 2085, "total_steps": 179580, "loss": 0.2034, "lr": 5.802427887292572e-06, "epoch": 0.23220848646842632, "percentage": 1.16, "elapsed_time": "0:12:37", "remaining_time": "17:55:24", "throughput": 3347.9, "total_tokens": 2537568} +{"current_steps": 2090, "total_steps": 179580, "loss": 0.2277, "lr": 5.816349259383004e-06, "epoch": 0.23276534135204366, "percentage": 1.16, "elapsed_time": "0:12:39", "remaining_time": "17:55:17", "throughput": 3347.93, "total_tokens": 2543456} +{"current_steps": 2095, "total_steps": 179580, "loss": 0.5482, "lr": 5.830270631473439e-06, "epoch": 0.233322196235661, "percentage": 1.17, "elapsed_time": "0:12:41", "remaining_time": "17:55:15", "throughput": 3348.03, "total_tokens": 2549632} +{"current_steps": 2100, "total_steps": 179580, "loss": 0.2857, "lr": 5.844192003563872e-06, "epoch": 0.23387905111927831, "percentage": 1.17, "elapsed_time": "0:12:43", "remaining_time": "17:55:17", "throughput": 3347.98, "total_tokens": 2555840} +{"current_steps": 2105, "total_steps": 179580, "loss": 0.1948, "lr": 5.858113375654305e-06, "epoch": 0.23443590600289566, "percentage": 1.17, "elapsed_time": "0:12:45", "remaining_time": "17:55:13", "throughput": 3347.95, "total_tokens": 2561792} +{"current_steps": 2110, "total_steps": 179580, "loss": 0.4464, "lr": 5.872034747744738e-06, "epoch": 0.23499276088651297, "percentage": 1.17, "elapsed_time": "0:12:46", "remaining_time": "17:55:08", "throughput": 3347.91, "total_tokens": 2567712} +{"current_steps": 2115, "total_steps": 179580, "loss": 0.2498, "lr": 5.885956119835171e-06, "epoch": 0.2355496157701303, "percentage": 1.18, "elapsed_time": "0:12:48", "remaining_time": "17:55:03", "throughput": 3347.91, "total_tokens": 2573664} +{"current_steps": 2120, "total_steps": 179580, "loss": 0.3289, "lr": 5.899877491925604e-06, "epoch": 0.23610647065374762, "percentage": 1.18, "elapsed_time": "0:12:50", "remaining_time": "17:55:09", "throughput": 3347.92, "total_tokens": 2580096} +{"current_steps": 2125, "total_steps": 179580, "loss": 0.222, "lr": 5.913798864016038e-06, "epoch": 0.23666332553736497, "percentage": 1.18, "elapsed_time": "0:12:52", "remaining_time": "17:55:15", "throughput": 3347.98, "total_tokens": 2586528} +{"current_steps": 2130, "total_steps": 179580, "loss": 0.1453, "lr": 5.927720236106471e-06, "epoch": 0.23722018042098228, "percentage": 1.19, "elapsed_time": "0:12:54", "remaining_time": "17:55:15", "throughput": 3347.99, "total_tokens": 2592704} +{"current_steps": 2135, "total_steps": 179580, "loss": 0.2377, "lr": 5.941641608196904e-06, "epoch": 0.23777703530459962, "percentage": 1.19, "elapsed_time": "0:12:56", "remaining_time": "17:55:06", "throughput": 3347.93, "total_tokens": 2598464} +{"current_steps": 2140, "total_steps": 179580, "loss": 0.156, "lr": 5.9555629802873375e-06, "epoch": 0.23833389018821696, "percentage": 1.19, "elapsed_time": "0:12:57", "remaining_time": "17:55:07", "throughput": 3347.97, "total_tokens": 2604672} +{"current_steps": 2145, "total_steps": 179580, "loss": 0.307, "lr": 5.969484352377771e-06, "epoch": 0.23889074507183428, "percentage": 1.19, "elapsed_time": "0:12:59", "remaining_time": "17:55:05", "throughput": 3347.98, "total_tokens": 2610752} +{"current_steps": 2150, "total_steps": 179580, "loss": 0.414, "lr": 5.983405724468204e-06, "epoch": 0.23944759995545162, "percentage": 1.2, "elapsed_time": "0:13:01", "remaining_time": "17:54:57", "throughput": 3348.0, "total_tokens": 2616608} +{"current_steps": 2155, "total_steps": 179580, "loss": 0.33, "lr": 5.997327096558637e-06, "epoch": 0.24000445483906893, "percentage": 1.2, "elapsed_time": "0:13:03", "remaining_time": "17:54:52", "throughput": 3348.03, "total_tokens": 2622592} +{"current_steps": 2160, "total_steps": 179580, "loss": 0.1804, "lr": 6.0112484686490705e-06, "epoch": 0.24056130972268627, "percentage": 1.2, "elapsed_time": "0:13:05", "remaining_time": "17:54:53", "throughput": 3347.91, "total_tokens": 2628704} +{"current_steps": 2165, "total_steps": 179580, "loss": 0.2862, "lr": 6.025169840739504e-06, "epoch": 0.2411181646063036, "percentage": 1.21, "elapsed_time": "0:13:06", "remaining_time": "17:54:50", "throughput": 3347.93, "total_tokens": 2634752} +{"current_steps": 2170, "total_steps": 179580, "loss": 0.4216, "lr": 6.039091212829937e-06, "epoch": 0.24167501948992093, "percentage": 1.21, "elapsed_time": "0:13:08", "remaining_time": "17:54:30", "throughput": 3347.74, "total_tokens": 2639936} +{"current_steps": 2175, "total_steps": 179580, "loss": 0.2962, "lr": 6.05301258492037e-06, "epoch": 0.24223187437353827, "percentage": 1.21, "elapsed_time": "0:13:10", "remaining_time": "17:54:29", "throughput": 3347.71, "total_tokens": 2646048} +{"current_steps": 2180, "total_steps": 179580, "loss": 0.3452, "lr": 6.066933957010804e-06, "epoch": 0.24278872925715558, "percentage": 1.21, "elapsed_time": "0:13:12", "remaining_time": "17:54:28", "throughput": 3347.66, "total_tokens": 2652128} +{"current_steps": 2185, "total_steps": 179580, "loss": 0.4808, "lr": 6.080855329101236e-06, "epoch": 0.24334558414077292, "percentage": 1.22, "elapsed_time": "0:13:14", "remaining_time": "17:54:25", "throughput": 3347.6, "total_tokens": 2658112} +{"current_steps": 2190, "total_steps": 179580, "loss": 0.3357, "lr": 6.09477670119167e-06, "epoch": 0.24390243902439024, "percentage": 1.22, "elapsed_time": "0:13:15", "remaining_time": "17:54:28", "throughput": 3347.65, "total_tokens": 2664416} +{"current_steps": 2195, "total_steps": 179580, "loss": 0.2747, "lr": 6.108698073282103e-06, "epoch": 0.24445929390800758, "percentage": 1.22, "elapsed_time": "0:13:17", "remaining_time": "17:54:30", "throughput": 3347.64, "total_tokens": 2670656} +{"current_steps": 2200, "total_steps": 179580, "loss": 0.3743, "lr": 6.122619445372537e-06, "epoch": 0.2450161487916249, "percentage": 1.23, "elapsed_time": "0:13:19", "remaining_time": "17:54:31", "throughput": 3347.56, "total_tokens": 2676800} +{"current_steps": 2205, "total_steps": 179580, "loss": 0.4194, "lr": 6.136540817462969e-06, "epoch": 0.24557300367524224, "percentage": 1.23, "elapsed_time": "0:13:21", "remaining_time": "17:54:25", "throughput": 3347.53, "total_tokens": 2682688} +{"current_steps": 2210, "total_steps": 179580, "loss": 0.224, "lr": 6.150462189553403e-06, "epoch": 0.24612985855885955, "percentage": 1.23, "elapsed_time": "0:13:23", "remaining_time": "17:54:27", "throughput": 3347.54, "total_tokens": 2688928} +{"current_steps": 2215, "total_steps": 179580, "loss": 0.3794, "lr": 6.1643835616438354e-06, "epoch": 0.2466867134424769, "percentage": 1.23, "elapsed_time": "0:13:25", "remaining_time": "17:54:22", "throughput": 3347.47, "total_tokens": 2694816} +{"current_steps": 2220, "total_steps": 179580, "loss": 0.4577, "lr": 6.178304933734269e-06, "epoch": 0.24724356832609423, "percentage": 1.24, "elapsed_time": "0:13:26", "remaining_time": "17:54:17", "throughput": 3347.39, "total_tokens": 2700704} +{"current_steps": 2225, "total_steps": 179580, "loss": 0.2409, "lr": 6.192226305824702e-06, "epoch": 0.24780042320971155, "percentage": 1.24, "elapsed_time": "0:13:28", "remaining_time": "17:54:20", "throughput": 3347.46, "total_tokens": 2707040} +{"current_steps": 2230, "total_steps": 179580, "loss": 0.4514, "lr": 6.206147677915136e-06, "epoch": 0.2483572780933289, "percentage": 1.24, "elapsed_time": "0:13:30", "remaining_time": "17:54:19", "throughput": 3347.44, "total_tokens": 2713152} +{"current_steps": 2235, "total_steps": 179580, "loss": 0.4519, "lr": 6.220069050005569e-06, "epoch": 0.2489141329769462, "percentage": 1.24, "elapsed_time": "0:13:32", "remaining_time": "17:54:21", "throughput": 3347.43, "total_tokens": 2719392} +{"current_steps": 2240, "total_steps": 179580, "loss": 0.2282, "lr": 6.233990422096002e-06, "epoch": 0.24947098786056354, "percentage": 1.25, "elapsed_time": "0:13:34", "remaining_time": "17:54:17", "throughput": 3347.48, "total_tokens": 2725408} +{"current_steps": 2245, "total_steps": 179580, "loss": 0.142, "lr": 6.2479117941864355e-06, "epoch": 0.2500278427441809, "percentage": 1.25, "elapsed_time": "0:13:35", "remaining_time": "17:54:16", "throughput": 3347.35, "total_tokens": 2731424} +{"current_steps": 2250, "total_steps": 179580, "loss": 0.3288, "lr": 6.261833166276869e-06, "epoch": 0.25058469762779817, "percentage": 1.25, "elapsed_time": "0:13:37", "remaining_time": "17:54:12", "throughput": 3347.5, "total_tokens": 2737536} +{"current_steps": 2255, "total_steps": 179580, "loss": 0.2527, "lr": 6.275754538367301e-06, "epoch": 0.2511415525114155, "percentage": 1.26, "elapsed_time": "0:13:39", "remaining_time": "17:54:15", "throughput": 3347.45, "total_tokens": 2743808} +{"current_steps": 2260, "total_steps": 179580, "loss": 0.3567, "lr": 6.289675910457734e-06, "epoch": 0.25169840739503285, "percentage": 1.26, "elapsed_time": "0:13:41", "remaining_time": "17:54:29", "throughput": 3346.7, "total_tokens": 2749952} +{"current_steps": 2265, "total_steps": 179580, "loss": 0.3048, "lr": 6.3035972825481686e-06, "epoch": 0.2522552622786502, "percentage": 1.26, "elapsed_time": "0:13:43", "remaining_time": "17:54:28", "throughput": 3346.59, "total_tokens": 2755968} +{"current_steps": 2270, "total_steps": 179580, "loss": 0.2404, "lr": 6.317518654638602e-06, "epoch": 0.25281211716226754, "percentage": 1.26, "elapsed_time": "0:13:45", "remaining_time": "17:54:32", "throughput": 3346.6, "total_tokens": 2762304} +{"current_steps": 2275, "total_steps": 179580, "loss": 0.2313, "lr": 6.3314400267290355e-06, "epoch": 0.2533689720458848, "percentage": 1.27, "elapsed_time": "0:13:47", "remaining_time": "17:54:29", "throughput": 3346.55, "total_tokens": 2768288} +{"current_steps": 2280, "total_steps": 179580, "loss": 0.2445, "lr": 6.345361398819467e-06, "epoch": 0.25392582692950216, "percentage": 1.27, "elapsed_time": "0:13:49", "remaining_time": "17:54:29", "throughput": 3346.63, "total_tokens": 2774528} +{"current_steps": 2285, "total_steps": 179580, "loss": 0.1795, "lr": 6.359282770909901e-06, "epoch": 0.2544826818131195, "percentage": 1.27, "elapsed_time": "0:13:50", "remaining_time": "17:54:27", "throughput": 3346.66, "total_tokens": 2780608} +{"current_steps": 2290, "total_steps": 179580, "loss": 0.16, "lr": 6.373204143000334e-06, "epoch": 0.25503953669673685, "percentage": 1.28, "elapsed_time": "0:13:52", "remaining_time": "17:54:30", "throughput": 3346.67, "total_tokens": 2786944} +{"current_steps": 2295, "total_steps": 179580, "loss": 0.262, "lr": 6.387125515090768e-06, "epoch": 0.25559639158035413, "percentage": 1.28, "elapsed_time": "0:13:54", "remaining_time": "17:54:30", "throughput": 3346.67, "total_tokens": 2793088} +{"current_steps": 2300, "total_steps": 179580, "loss": 0.31, "lr": 6.401046887181201e-06, "epoch": 0.2561532464639715, "percentage": 1.28, "elapsed_time": "0:13:56", "remaining_time": "17:54:30", "throughput": 3346.71, "total_tokens": 2799264} +{"current_steps": 2305, "total_steps": 179580, "loss": 0.4499, "lr": 6.414968259271634e-06, "epoch": 0.2567101013475888, "percentage": 1.28, "elapsed_time": "0:13:58", "remaining_time": "17:54:29", "throughput": 3346.7, "total_tokens": 2805376} +{"current_steps": 2310, "total_steps": 179580, "loss": 0.5246, "lr": 6.428889631362067e-06, "epoch": 0.25726695623120616, "percentage": 1.29, "elapsed_time": "0:13:59", "remaining_time": "17:54:13", "throughput": 3346.62, "total_tokens": 2810784} +{"current_steps": 2315, "total_steps": 179580, "loss": 0.4321, "lr": 6.442811003452501e-06, "epoch": 0.2578238111148235, "percentage": 1.29, "elapsed_time": "0:14:01", "remaining_time": "17:54:12", "throughput": 3346.59, "total_tokens": 2816896} +{"current_steps": 2320, "total_steps": 179580, "loss": 0.2758, "lr": 6.456732375542934e-06, "epoch": 0.2583806659984408, "percentage": 1.29, "elapsed_time": "0:14:03", "remaining_time": "17:54:18", "throughput": 3346.6, "total_tokens": 2823328} +{"current_steps": 2325, "total_steps": 179580, "loss": 0.2443, "lr": 6.470653747633366e-06, "epoch": 0.2589375208820581, "percentage": 1.29, "elapsed_time": "0:14:05", "remaining_time": "17:54:19", "throughput": 3346.57, "total_tokens": 2829504} +{"current_steps": 2330, "total_steps": 179580, "loss": 0.2656, "lr": 6.4845751197238e-06, "epoch": 0.25949437576567547, "percentage": 1.3, "elapsed_time": "0:14:07", "remaining_time": "17:54:20", "throughput": 3346.58, "total_tokens": 2835744} +{"current_steps": 2335, "total_steps": 179580, "loss": 0.3716, "lr": 6.498496491814234e-06, "epoch": 0.2600512306492928, "percentage": 1.3, "elapsed_time": "0:14:09", "remaining_time": "17:54:18", "throughput": 3346.63, "total_tokens": 2841856} +{"current_steps": 2340, "total_steps": 179580, "loss": 0.3479, "lr": 6.512417863904667e-06, "epoch": 0.26060808553291015, "percentage": 1.3, "elapsed_time": "0:14:11", "remaining_time": "17:54:19", "throughput": 3346.59, "total_tokens": 2848032} +{"current_steps": 2345, "total_steps": 179580, "loss": 0.2981, "lr": 6.526339235995101e-06, "epoch": 0.26116494041652744, "percentage": 1.31, "elapsed_time": "0:14:12", "remaining_time": "17:54:18", "throughput": 3346.6, "total_tokens": 2854176} +{"current_steps": 2350, "total_steps": 179580, "loss": 0.1601, "lr": 6.540260608085533e-06, "epoch": 0.2617217953001448, "percentage": 1.31, "elapsed_time": "0:14:14", "remaining_time": "17:54:20", "throughput": 3346.63, "total_tokens": 2860448} +{"current_steps": 2355, "total_steps": 179580, "loss": 0.4224, "lr": 6.554181980175966e-06, "epoch": 0.2622786501837621, "percentage": 1.31, "elapsed_time": "0:14:16", "remaining_time": "17:54:19", "throughput": 3346.79, "total_tokens": 2866688} +{"current_steps": 2360, "total_steps": 179580, "loss": 0.5447, "lr": 6.5681033522664e-06, "epoch": 0.26283550506737946, "percentage": 1.31, "elapsed_time": "0:14:18", "remaining_time": "17:54:21", "throughput": 3346.79, "total_tokens": 2872928} +{"current_steps": 2365, "total_steps": 179580, "loss": 0.6743, "lr": 6.582024724356833e-06, "epoch": 0.26339235995099675, "percentage": 1.32, "elapsed_time": "0:14:20", "remaining_time": "17:54:20", "throughput": 3346.85, "total_tokens": 2879136} +{"current_steps": 2370, "total_steps": 179580, "loss": 0.1885, "lr": 6.595946096447266e-06, "epoch": 0.2639492148346141, "percentage": 1.32, "elapsed_time": "0:14:22", "remaining_time": "17:54:17", "throughput": 3346.85, "total_tokens": 2885152} +{"current_steps": 2375, "total_steps": 179580, "loss": 0.2115, "lr": 6.609867468537699e-06, "epoch": 0.26450606971823143, "percentage": 1.32, "elapsed_time": "0:14:23", "remaining_time": "17:54:18", "throughput": 3346.78, "total_tokens": 2891296} +{"current_steps": 2380, "total_steps": 179580, "loss": 0.2728, "lr": 6.623788840628133e-06, "epoch": 0.26506292460184877, "percentage": 1.33, "elapsed_time": "0:14:25", "remaining_time": "17:54:22", "throughput": 3346.82, "total_tokens": 2897696} +{"current_steps": 2385, "total_steps": 179580, "loss": 0.3382, "lr": 6.637710212718566e-06, "epoch": 0.2656197794854661, "percentage": 1.33, "elapsed_time": "0:14:27", "remaining_time": "17:54:14", "throughput": 3346.78, "total_tokens": 2903456} +{"current_steps": 2390, "total_steps": 179580, "loss": 0.429, "lr": 6.651631584809e-06, "epoch": 0.2661766343690834, "percentage": 1.33, "elapsed_time": "0:14:29", "remaining_time": "17:54:13", "throughput": 3346.82, "total_tokens": 2909632} +{"current_steps": 2395, "total_steps": 179580, "loss": 0.4282, "lr": 6.6655529568994315e-06, "epoch": 0.26673348925270074, "percentage": 1.33, "elapsed_time": "0:14:31", "remaining_time": "17:54:13", "throughput": 3346.89, "total_tokens": 2915872} +{"current_steps": 2400, "total_steps": 179580, "loss": 0.4122, "lr": 6.679474328989865e-06, "epoch": 0.2672903441363181, "percentage": 1.34, "elapsed_time": "0:14:33", "remaining_time": "17:54:12", "throughput": 3346.82, "total_tokens": 2921920} +{"current_steps": 2405, "total_steps": 179580, "loss": 0.0986, "lr": 6.693395701080299e-06, "epoch": 0.2678471990199354, "percentage": 1.34, "elapsed_time": "0:14:34", "remaining_time": "17:54:19", "throughput": 3346.98, "total_tokens": 2928544} +{"current_steps": 2410, "total_steps": 179580, "loss": 0.2573, "lr": 6.707317073170733e-06, "epoch": 0.2684040539035527, "percentage": 1.34, "elapsed_time": "0:14:36", "remaining_time": "17:54:19", "throughput": 3347.0, "total_tokens": 2934720} +{"current_steps": 2415, "total_steps": 179580, "loss": 0.5394, "lr": 6.7212384452611645e-06, "epoch": 0.26896090878717005, "percentage": 1.34, "elapsed_time": "0:14:38", "remaining_time": "17:54:16", "throughput": 3347.0, "total_tokens": 2940768} +{"current_steps": 2420, "total_steps": 179580, "loss": 0.1876, "lr": 6.735159817351598e-06, "epoch": 0.2695177636707874, "percentage": 1.35, "elapsed_time": "0:14:40", "remaining_time": "17:54:14", "throughput": 3346.92, "total_tokens": 2946784} +{"current_steps": 2425, "total_steps": 179580, "loss": 0.425, "lr": 6.7490811894420315e-06, "epoch": 0.27007461855440473, "percentage": 1.35, "elapsed_time": "0:14:42", "remaining_time": "17:54:07", "throughput": 3346.93, "total_tokens": 2952640} +{"current_steps": 2430, "total_steps": 179580, "loss": 0.2493, "lr": 6.763002561532465e-06, "epoch": 0.2706314734380221, "percentage": 1.35, "elapsed_time": "0:14:43", "remaining_time": "17:54:02", "throughput": 3346.86, "total_tokens": 2958528} +{"current_steps": 2435, "total_steps": 179580, "loss": 0.232, "lr": 6.7769239336228985e-06, "epoch": 0.27118832832163936, "percentage": 1.36, "elapsed_time": "0:14:45", "remaining_time": "17:53:52", "throughput": 3346.84, "total_tokens": 2964224} +{"current_steps": 2440, "total_steps": 179580, "loss": 0.2404, "lr": 6.790845305713331e-06, "epoch": 0.2717451832052567, "percentage": 1.36, "elapsed_time": "0:14:47", "remaining_time": "17:53:56", "throughput": 3346.88, "total_tokens": 2970624} +{"current_steps": 2445, "total_steps": 179580, "loss": 0.2974, "lr": 6.804766677803765e-06, "epoch": 0.27230203808887404, "percentage": 1.36, "elapsed_time": "0:14:49", "remaining_time": "17:53:49", "throughput": 3346.92, "total_tokens": 2976512} +{"current_steps": 2450, "total_steps": 179580, "loss": 0.2187, "lr": 6.818688049894198e-06, "epoch": 0.2728588929724914, "percentage": 1.36, "elapsed_time": "0:14:51", "remaining_time": "17:53:48", "throughput": 3346.99, "total_tokens": 2982656} +{"current_steps": 2455, "total_steps": 179580, "loss": 0.3449, "lr": 6.8326094219846315e-06, "epoch": 0.27341574785610867, "percentage": 1.37, "elapsed_time": "0:14:52", "remaining_time": "17:53:45", "throughput": 3346.96, "total_tokens": 2988672} +{"current_steps": 2460, "total_steps": 179580, "loss": 0.2355, "lr": 6.846530794075065e-06, "epoch": 0.273972602739726, "percentage": 1.37, "elapsed_time": "0:14:54", "remaining_time": "17:53:42", "throughput": 3346.99, "total_tokens": 2994752} +{"current_steps": 2465, "total_steps": 179580, "loss": 0.3406, "lr": 6.860452166165497e-06, "epoch": 0.27452945762334335, "percentage": 1.37, "elapsed_time": "0:14:56", "remaining_time": "17:53:39", "throughput": 3346.98, "total_tokens": 3000768} +{"current_steps": 2470, "total_steps": 179580, "loss": 0.2966, "lr": 6.874373538255931e-06, "epoch": 0.2750863125069607, "percentage": 1.38, "elapsed_time": "0:14:58", "remaining_time": "17:53:39", "throughput": 3346.98, "total_tokens": 3006912} +{"current_steps": 2475, "total_steps": 179580, "loss": 0.3812, "lr": 6.888294910346365e-06, "epoch": 0.27564316739057804, "percentage": 1.38, "elapsed_time": "0:15:00", "remaining_time": "17:53:32", "throughput": 3347.02, "total_tokens": 3012800} +{"current_steps": 2480, "total_steps": 179580, "loss": 0.2706, "lr": 6.902216282436798e-06, "epoch": 0.2762000222741953, "percentage": 1.38, "elapsed_time": "0:15:02", "remaining_time": "17:53:33", "throughput": 3347.07, "total_tokens": 3019104} +{"current_steps": 2485, "total_steps": 179580, "loss": 0.1591, "lr": 6.91613765452723e-06, "epoch": 0.27675687715781266, "percentage": 1.38, "elapsed_time": "0:15:03", "remaining_time": "17:53:35", "throughput": 3347.15, "total_tokens": 3025440} +{"current_steps": 2490, "total_steps": 179580, "loss": 0.2215, "lr": 6.930059026617663e-06, "epoch": 0.27731373204143, "percentage": 1.39, "elapsed_time": "0:15:05", "remaining_time": "17:53:33", "throughput": 3347.08, "total_tokens": 3031456} +{"current_steps": 2495, "total_steps": 179580, "loss": 0.1187, "lr": 6.943980398708097e-06, "epoch": 0.27787058692504735, "percentage": 1.39, "elapsed_time": "0:15:07", "remaining_time": "17:53:34", "throughput": 3347.11, "total_tokens": 3037664} +{"current_steps": 2500, "total_steps": 179580, "loss": 0.1668, "lr": 6.95790177079853e-06, "epoch": 0.2784274418086647, "percentage": 1.39, "elapsed_time": "0:15:09", "remaining_time": "17:53:36", "throughput": 3347.15, "total_tokens": 3043968} +{"current_steps": 2505, "total_steps": 179580, "loss": 0.2758, "lr": 6.971823142888964e-06, "epoch": 0.278984296692282, "percentage": 1.39, "elapsed_time": "0:15:11", "remaining_time": "17:53:31", "throughput": 3347.13, "total_tokens": 3049888} +{"current_steps": 2510, "total_steps": 179580, "loss": 0.2687, "lr": 6.9857445149793965e-06, "epoch": 0.2795411515758993, "percentage": 1.4, "elapsed_time": "0:15:13", "remaining_time": "17:53:31", "throughput": 3347.13, "total_tokens": 3056096} +{"current_steps": 2515, "total_steps": 179580, "loss": 0.4114, "lr": 6.99966588706983e-06, "epoch": 0.28009800645951666, "percentage": 1.4, "elapsed_time": "0:15:14", "remaining_time": "17:53:34", "throughput": 3347.18, "total_tokens": 3062464} +{"current_steps": 2520, "total_steps": 179580, "loss": 0.2778, "lr": 7.013587259160263e-06, "epoch": 0.280654861343134, "percentage": 1.4, "elapsed_time": "0:15:16", "remaining_time": "17:53:35", "throughput": 3347.28, "total_tokens": 3068736} +{"current_steps": 2525, "total_steps": 179580, "loss": 0.3461, "lr": 7.027508631250697e-06, "epoch": 0.2812117162267513, "percentage": 1.41, "elapsed_time": "0:15:18", "remaining_time": "17:53:35", "throughput": 3347.36, "total_tokens": 3075008} +{"current_steps": 2530, "total_steps": 179580, "loss": 0.1142, "lr": 7.041430003341129e-06, "epoch": 0.2817685711103686, "percentage": 1.41, "elapsed_time": "0:15:20", "remaining_time": "17:53:34", "throughput": 3347.3, "total_tokens": 3081088} +{"current_steps": 2535, "total_steps": 179580, "loss": 0.2062, "lr": 7.055351375431562e-06, "epoch": 0.28232542599398597, "percentage": 1.41, "elapsed_time": "0:15:22", "remaining_time": "17:53:20", "throughput": 3347.14, "total_tokens": 3086432} +{"current_steps": 2540, "total_steps": 179580, "loss": 0.1361, "lr": 7.0692727475219965e-06, "epoch": 0.2828822808776033, "percentage": 1.41, "elapsed_time": "0:15:23", "remaining_time": "17:53:18", "throughput": 3347.22, "total_tokens": 3092576} +{"current_steps": 2545, "total_steps": 179580, "loss": 0.27, "lr": 7.08319411961243e-06, "epoch": 0.28343913576122065, "percentage": 1.42, "elapsed_time": "0:15:25", "remaining_time": "17:53:15", "throughput": 3347.17, "total_tokens": 3098560} +{"current_steps": 2550, "total_steps": 179580, "loss": 0.1745, "lr": 7.0971154917028635e-06, "epoch": 0.28399599064483794, "percentage": 1.42, "elapsed_time": "0:15:27", "remaining_time": "17:53:12", "throughput": 3347.22, "total_tokens": 3104672} +{"current_steps": 2555, "total_steps": 179580, "loss": 0.3052, "lr": 7.111036863793295e-06, "epoch": 0.2845528455284553, "percentage": 1.42, "elapsed_time": "0:15:29", "remaining_time": "17:53:10", "throughput": 3347.15, "total_tokens": 3110656} +{"current_steps": 2560, "total_steps": 179580, "loss": 0.2145, "lr": 7.124958235883729e-06, "epoch": 0.2851097004120726, "percentage": 1.43, "elapsed_time": "0:15:31", "remaining_time": "17:53:10", "throughput": 3347.14, "total_tokens": 3116832} +{"current_steps": 2565, "total_steps": 179580, "loss": 0.2492, "lr": 7.138879607974162e-06, "epoch": 0.28566655529568996, "percentage": 1.43, "elapsed_time": "0:15:32", "remaining_time": "17:52:54", "throughput": 3347.12, "total_tokens": 3122208} +{"current_steps": 2570, "total_steps": 179580, "loss": 0.2462, "lr": 7.152800980064596e-06, "epoch": 0.28622341017930725, "percentage": 1.43, "elapsed_time": "0:15:34", "remaining_time": "17:52:58", "throughput": 3347.21, "total_tokens": 3128672} +{"current_steps": 2575, "total_steps": 179580, "loss": 0.1866, "lr": 7.166722352155028e-06, "epoch": 0.2867802650629246, "percentage": 1.43, "elapsed_time": "0:15:36", "remaining_time": "17:52:59", "throughput": 3347.18, "total_tokens": 3134880} +{"current_steps": 2580, "total_steps": 179580, "loss": 0.2711, "lr": 7.180643724245462e-06, "epoch": 0.28733711994654193, "percentage": 1.44, "elapsed_time": "0:15:38", "remaining_time": "17:52:56", "throughput": 3347.13, "total_tokens": 3140864} +{"current_steps": 2585, "total_steps": 179580, "loss": 0.3834, "lr": 7.194565096335895e-06, "epoch": 0.28789397483015927, "percentage": 1.44, "elapsed_time": "0:15:40", "remaining_time": "17:52:51", "throughput": 3347.05, "total_tokens": 3146688} +{"current_steps": 2590, "total_steps": 179580, "loss": 0.4031, "lr": 7.208486468426329e-06, "epoch": 0.2884508297137766, "percentage": 1.44, "elapsed_time": "0:15:41", "remaining_time": "17:52:49", "throughput": 3347.12, "total_tokens": 3152832} +{"current_steps": 2595, "total_steps": 179580, "loss": 0.2274, "lr": 7.222407840516762e-06, "epoch": 0.2890076845973939, "percentage": 1.45, "elapsed_time": "0:15:43", "remaining_time": "17:52:45", "throughput": 3347.03, "total_tokens": 3158752} +{"current_steps": 2600, "total_steps": 179580, "loss": 0.36, "lr": 7.236329212607194e-06, "epoch": 0.28956453948101124, "percentage": 1.45, "elapsed_time": "0:15:45", "remaining_time": "17:52:39", "throughput": 3346.96, "total_tokens": 3164544} +{"current_steps": 2605, "total_steps": 179580, "loss": 0.1954, "lr": 7.2502505846976275e-06, "epoch": 0.2901213943646286, "percentage": 1.45, "elapsed_time": "0:15:47", "remaining_time": "17:52:39", "throughput": 3347.04, "total_tokens": 3170784} +{"current_steps": 2610, "total_steps": 179580, "loss": 0.188, "lr": 7.264171956788062e-06, "epoch": 0.2906782492482459, "percentage": 1.45, "elapsed_time": "0:15:49", "remaining_time": "17:52:34", "throughput": 3347.07, "total_tokens": 3176768} +{"current_steps": 2615, "total_steps": 179580, "loss": 0.2819, "lr": 7.278093328878495e-06, "epoch": 0.2912351041318632, "percentage": 1.46, "elapsed_time": "0:15:51", "remaining_time": "17:52:37", "throughput": 3347.06, "total_tokens": 3183072} +{"current_steps": 2620, "total_steps": 179580, "loss": 0.2872, "lr": 7.292014700968929e-06, "epoch": 0.29179195901548055, "percentage": 1.46, "elapsed_time": "0:15:52", "remaining_time": "17:52:39", "throughput": 3346.98, "total_tokens": 3189280} +{"current_steps": 2625, "total_steps": 179580, "loss": 0.1567, "lr": 7.305936073059361e-06, "epoch": 0.2923488138990979, "percentage": 1.46, "elapsed_time": "0:15:54", "remaining_time": "17:52:38", "throughput": 3347.01, "total_tokens": 3195424} +{"current_steps": 2630, "total_steps": 179580, "loss": 0.3243, "lr": 7.319857445149794e-06, "epoch": 0.29290566878271523, "percentage": 1.46, "elapsed_time": "0:15:56", "remaining_time": "17:52:37", "throughput": 3347.02, "total_tokens": 3201568} +{"current_steps": 2635, "total_steps": 179580, "loss": 0.2543, "lr": 7.3337788172402276e-06, "epoch": 0.2934625236663326, "percentage": 1.47, "elapsed_time": "0:15:58", "remaining_time": "17:52:35", "throughput": 3347.08, "total_tokens": 3207680} +{"current_steps": 2640, "total_steps": 179580, "loss": 0.3406, "lr": 7.347700189330661e-06, "epoch": 0.29401937854994986, "percentage": 1.47, "elapsed_time": "0:16:00", "remaining_time": "17:52:33", "throughput": 3347.14, "total_tokens": 3213824} +{"current_steps": 2645, "total_steps": 179580, "loss": 0.3308, "lr": 7.361621561421094e-06, "epoch": 0.2945762334335672, "percentage": 1.47, "elapsed_time": "0:16:01", "remaining_time": "17:52:31", "throughput": 3347.1, "total_tokens": 3219904} +{"current_steps": 2650, "total_steps": 179580, "loss": 0.3364, "lr": 7.375542933511527e-06, "epoch": 0.29513308831718454, "percentage": 1.48, "elapsed_time": "0:16:03", "remaining_time": "17:52:33", "throughput": 3347.17, "total_tokens": 3226240} +{"current_steps": 2655, "total_steps": 179580, "loss": 0.308, "lr": 7.389464305601961e-06, "epoch": 0.2956899432008019, "percentage": 1.48, "elapsed_time": "0:16:05", "remaining_time": "17:52:31", "throughput": 3347.24, "total_tokens": 3232352} +{"current_steps": 2660, "total_steps": 179580, "loss": 0.2424, "lr": 7.403385677692394e-06, "epoch": 0.2962467980844192, "percentage": 1.48, "elapsed_time": "0:16:07", "remaining_time": "17:52:28", "throughput": 3347.2, "total_tokens": 3238368} +{"current_steps": 2665, "total_steps": 179580, "loss": 0.5633, "lr": 7.417307049782828e-06, "epoch": 0.2968036529680365, "percentage": 1.48, "elapsed_time": "0:16:09", "remaining_time": "17:52:25", "throughput": 3347.2, "total_tokens": 3244384} +{"current_steps": 2670, "total_steps": 179580, "loss": 0.2428, "lr": 7.431228421873259e-06, "epoch": 0.29736050785165385, "percentage": 1.49, "elapsed_time": "0:16:11", "remaining_time": "17:52:27", "throughput": 3347.16, "total_tokens": 3250656} +{"current_steps": 2675, "total_steps": 179580, "loss": 0.3951, "lr": 7.445149793963693e-06, "epoch": 0.2979173627352712, "percentage": 1.49, "elapsed_time": "0:16:12", "remaining_time": "17:52:20", "throughput": 3347.14, "total_tokens": 3256416} +{"current_steps": 2680, "total_steps": 179580, "loss": 0.2854, "lr": 7.459071166054127e-06, "epoch": 0.29847421761888854, "percentage": 1.49, "elapsed_time": "0:16:14", "remaining_time": "17:52:14", "throughput": 3347.11, "total_tokens": 3262304} +{"current_steps": 2685, "total_steps": 179580, "loss": 0.2799, "lr": 7.472992538144561e-06, "epoch": 0.2990310725025058, "percentage": 1.5, "elapsed_time": "0:16:16", "remaining_time": "17:52:14", "throughput": 3347.12, "total_tokens": 3268448} +{"current_steps": 2690, "total_steps": 179580, "loss": 0.5888, "lr": 7.4869139102349925e-06, "epoch": 0.29958792738612317, "percentage": 1.5, "elapsed_time": "0:16:18", "remaining_time": "17:52:06", "throughput": 3347.03, "total_tokens": 3274144} +{"current_steps": 2695, "total_steps": 179580, "loss": 0.265, "lr": 7.500835282325426e-06, "epoch": 0.3001447822697405, "percentage": 1.5, "elapsed_time": "0:16:20", "remaining_time": "17:52:05", "throughput": 3347.03, "total_tokens": 3280288} +{"current_steps": 2700, "total_steps": 179580, "loss": 0.1398, "lr": 7.5147566544158594e-06, "epoch": 0.30070163715335785, "percentage": 1.5, "elapsed_time": "0:16:21", "remaining_time": "17:52:07", "throughput": 3347.07, "total_tokens": 3286592} +{"current_steps": 2705, "total_steps": 179580, "loss": 0.172, "lr": 7.528678026506293e-06, "epoch": 0.3012584920369752, "percentage": 1.51, "elapsed_time": "0:16:23", "remaining_time": "17:51:58", "throughput": 3346.95, "total_tokens": 3292224} +{"current_steps": 2710, "total_steps": 179580, "loss": 0.3109, "lr": 7.542599398596726e-06, "epoch": 0.3018153469205925, "percentage": 1.51, "elapsed_time": "0:16:25", "remaining_time": "17:51:55", "throughput": 3346.93, "total_tokens": 3298208} +{"current_steps": 2715, "total_steps": 179580, "loss": 0.3498, "lr": 7.556520770687159e-06, "epoch": 0.3023722018042098, "percentage": 1.51, "elapsed_time": "0:16:27", "remaining_time": "17:51:52", "throughput": 3346.94, "total_tokens": 3304256} +{"current_steps": 2720, "total_steps": 179580, "loss": 0.3067, "lr": 7.5704421427775925e-06, "epoch": 0.30292905668782716, "percentage": 1.51, "elapsed_time": "0:16:29", "remaining_time": "17:51:48", "throughput": 3346.85, "total_tokens": 3310112} +{"current_steps": 2725, "total_steps": 179580, "loss": 0.2908, "lr": 7.584363514868026e-06, "epoch": 0.3034859115714445, "percentage": 1.52, "elapsed_time": "0:16:30", "remaining_time": "17:51:48", "throughput": 3346.99, "total_tokens": 3316448} +{"current_steps": 2730, "total_steps": 179580, "loss": 0.2722, "lr": 7.5982848869584595e-06, "epoch": 0.3040427664550618, "percentage": 1.52, "elapsed_time": "0:16:32", "remaining_time": "17:51:42", "throughput": 3347.06, "total_tokens": 3322400} +{"current_steps": 2735, "total_steps": 179580, "loss": 0.3382, "lr": 7.612206259048891e-06, "epoch": 0.3045996213386791, "percentage": 1.52, "elapsed_time": "0:16:34", "remaining_time": "17:51:36", "throughput": 3347.09, "total_tokens": 3328288} +{"current_steps": 2740, "total_steps": 179580, "loss": 0.4465, "lr": 7.626127631139325e-06, "epoch": 0.30515647622229647, "percentage": 1.53, "elapsed_time": "0:16:36", "remaining_time": "17:51:34", "throughput": 3347.13, "total_tokens": 3334368} +{"current_steps": 2745, "total_steps": 179580, "loss": 0.1152, "lr": 7.640049003229759e-06, "epoch": 0.3057133311059138, "percentage": 1.53, "elapsed_time": "0:16:37", "remaining_time": "17:51:30", "throughput": 3347.06, "total_tokens": 3340288} +{"current_steps": 2750, "total_steps": 179580, "loss": 0.2432, "lr": 7.653970375320192e-06, "epoch": 0.30627018598953115, "percentage": 1.53, "elapsed_time": "0:16:39", "remaining_time": "17:51:32", "throughput": 3347.12, "total_tokens": 3346624} +{"current_steps": 2755, "total_steps": 179580, "loss": 0.2729, "lr": 7.667891747410626e-06, "epoch": 0.30682704087314844, "percentage": 1.53, "elapsed_time": "0:16:41", "remaining_time": "17:51:24", "throughput": 3347.11, "total_tokens": 3352384} +{"current_steps": 2760, "total_steps": 179580, "loss": 0.4201, "lr": 7.681813119501059e-06, "epoch": 0.3073838957567658, "percentage": 1.54, "elapsed_time": "0:16:43", "remaining_time": "17:51:21", "throughput": 3347.14, "total_tokens": 3358464} +{"current_steps": 2765, "total_steps": 179580, "loss": 0.3038, "lr": 7.695734491591491e-06, "epoch": 0.3079407506403831, "percentage": 1.54, "elapsed_time": "0:16:45", "remaining_time": "17:51:19", "throughput": 3347.17, "total_tokens": 3364544} +{"current_steps": 2770, "total_steps": 179580, "loss": 0.1337, "lr": 7.709655863681926e-06, "epoch": 0.30849760552400046, "percentage": 1.54, "elapsed_time": "0:16:47", "remaining_time": "17:51:21", "throughput": 3347.26, "total_tokens": 3370912} +{"current_steps": 2775, "total_steps": 179580, "loss": 0.2166, "lr": 7.723577235772358e-06, "epoch": 0.30905446040761775, "percentage": 1.55, "elapsed_time": "0:16:48", "remaining_time": "17:51:18", "throughput": 3347.28, "total_tokens": 3376960} +{"current_steps": 2780, "total_steps": 179580, "loss": 0.1899, "lr": 7.737498607862793e-06, "epoch": 0.3096113152912351, "percentage": 1.55, "elapsed_time": "0:16:50", "remaining_time": "17:51:20", "throughput": 3347.37, "total_tokens": 3383328} +{"current_steps": 2785, "total_steps": 179580, "loss": 0.1623, "lr": 7.751419979953224e-06, "epoch": 0.31016817017485243, "percentage": 1.55, "elapsed_time": "0:16:52", "remaining_time": "17:51:16", "throughput": 3347.41, "total_tokens": 3389376} +{"current_steps": 2790, "total_steps": 179580, "loss": 0.5435, "lr": 7.765341352043658e-06, "epoch": 0.3107250250584698, "percentage": 1.55, "elapsed_time": "0:16:54", "remaining_time": "17:51:16", "throughput": 3347.49, "total_tokens": 3395616} +{"current_steps": 2795, "total_steps": 179580, "loss": 0.3354, "lr": 7.77926272413409e-06, "epoch": 0.3112818799420871, "percentage": 1.56, "elapsed_time": "0:16:56", "remaining_time": "17:51:06", "throughput": 3347.4, "total_tokens": 3401184} +{"current_steps": 2800, "total_steps": 179580, "loss": 0.2133, "lr": 7.793184096224525e-06, "epoch": 0.3118387348257044, "percentage": 1.56, "elapsed_time": "0:16:57", "remaining_time": "17:51:10", "throughput": 3347.44, "total_tokens": 3407584} +{"current_steps": 2805, "total_steps": 179580, "loss": 0.2072, "lr": 7.807105468314957e-06, "epoch": 0.31239558970932174, "percentage": 1.56, "elapsed_time": "0:16:59", "remaining_time": "17:51:12", "throughput": 3347.55, "total_tokens": 3414016} +{"current_steps": 2810, "total_steps": 179580, "loss": 0.247, "lr": 7.82102684040539e-06, "epoch": 0.3129524445929391, "percentage": 1.56, "elapsed_time": "0:17:01", "remaining_time": "17:50:59", "throughput": 3347.5, "total_tokens": 3419424} +{"current_steps": 2815, "total_steps": 179580, "loss": 0.2684, "lr": 7.834948212495824e-06, "epoch": 0.3135092994765564, "percentage": 1.57, "elapsed_time": "0:17:03", "remaining_time": "17:50:54", "throughput": 3347.47, "total_tokens": 3425312} +{"current_steps": 2820, "total_steps": 179580, "loss": 0.1868, "lr": 7.848869584586257e-06, "epoch": 0.31406615436017377, "percentage": 1.57, "elapsed_time": "0:17:05", "remaining_time": "17:50:51", "throughput": 3347.5, "total_tokens": 3431392} +{"current_steps": 2825, "total_steps": 179580, "loss": 0.379, "lr": 7.862790956676691e-06, "epoch": 0.31462300924379105, "percentage": 1.57, "elapsed_time": "0:17:06", "remaining_time": "17:50:56", "throughput": 3347.53, "total_tokens": 3437856} +{"current_steps": 2830, "total_steps": 179580, "loss": 0.3115, "lr": 7.876712328767124e-06, "epoch": 0.3151798641274084, "percentage": 1.58, "elapsed_time": "0:17:08", "remaining_time": "17:50:56", "throughput": 3347.53, "total_tokens": 3444032} +{"current_steps": 2835, "total_steps": 179580, "loss": 0.2421, "lr": 7.890633700857557e-06, "epoch": 0.31573671901102573, "percentage": 1.58, "elapsed_time": "0:17:10", "remaining_time": "17:50:52", "throughput": 3347.64, "total_tokens": 3450112} +{"current_steps": 2840, "total_steps": 179580, "loss": 0.1707, "lr": 7.904555072947991e-06, "epoch": 0.3162935738946431, "percentage": 1.58, "elapsed_time": "0:17:12", "remaining_time": "17:50:52", "throughput": 3347.69, "total_tokens": 3456352} +{"current_steps": 2845, "total_steps": 179580, "loss": 0.4818, "lr": 7.918476445038424e-06, "epoch": 0.31685042877826036, "percentage": 1.58, "elapsed_time": "0:17:14", "remaining_time": "17:50:53", "throughput": 3347.65, "total_tokens": 3462528} +{"current_steps": 2850, "total_steps": 179580, "loss": 0.3631, "lr": 7.932397817128856e-06, "epoch": 0.3174072836618777, "percentage": 1.59, "elapsed_time": "0:17:16", "remaining_time": "17:50:53", "throughput": 3347.69, "total_tokens": 3468800} +{"current_steps": 2855, "total_steps": 179580, "loss": 0.3282, "lr": 7.946319189219289e-06, "epoch": 0.31796413854549505, "percentage": 1.59, "elapsed_time": "0:17:18", "remaining_time": "17:50:55", "throughput": 3347.67, "total_tokens": 3475040} +{"current_steps": 2860, "total_steps": 179580, "loss": 0.2156, "lr": 7.960240561309723e-06, "epoch": 0.3185209934291124, "percentage": 1.59, "elapsed_time": "0:17:19", "remaining_time": "17:50:59", "throughput": 3347.67, "total_tokens": 3481472} +{"current_steps": 2865, "total_steps": 179580, "loss": 0.3753, "lr": 7.974161933400156e-06, "epoch": 0.31907784831272973, "percentage": 1.6, "elapsed_time": "0:17:21", "remaining_time": "17:50:56", "throughput": 3347.61, "total_tokens": 3487424} +{"current_steps": 2870, "total_steps": 179580, "loss": 0.2551, "lr": 7.98808330549059e-06, "epoch": 0.319634703196347, "percentage": 1.6, "elapsed_time": "0:17:23", "remaining_time": "17:50:55", "throughput": 3347.63, "total_tokens": 3493568} +{"current_steps": 2875, "total_steps": 179580, "loss": 0.3504, "lr": 8.002004677581023e-06, "epoch": 0.32019155807996436, "percentage": 1.6, "elapsed_time": "0:17:25", "remaining_time": "17:50:53", "throughput": 3347.73, "total_tokens": 3499744} +{"current_steps": 2880, "total_steps": 179580, "loss": 0.2441, "lr": 8.015926049671455e-06, "epoch": 0.3207484129635817, "percentage": 1.6, "elapsed_time": "0:17:27", "remaining_time": "17:50:53", "throughput": 3347.81, "total_tokens": 3506016} +{"current_steps": 2885, "total_steps": 179580, "loss": 0.1696, "lr": 8.02984742176189e-06, "epoch": 0.32130526784719904, "percentage": 1.61, "elapsed_time": "0:17:29", "remaining_time": "17:50:51", "throughput": 3347.83, "total_tokens": 3512096} +{"current_steps": 2890, "total_steps": 179580, "loss": 0.4023, "lr": 8.043768793852322e-06, "epoch": 0.3218621227308163, "percentage": 1.61, "elapsed_time": "0:17:30", "remaining_time": "17:50:48", "throughput": 3347.79, "total_tokens": 3518080} +{"current_steps": 2895, "total_steps": 179580, "loss": 0.1712, "lr": 8.057690165942755e-06, "epoch": 0.32241897761443367, "percentage": 1.61, "elapsed_time": "0:17:32", "remaining_time": "17:50:45", "throughput": 3347.76, "total_tokens": 3524064} +{"current_steps": 2900, "total_steps": 179580, "loss": 0.2008, "lr": 8.07161153803319e-06, "epoch": 0.322975832498051, "percentage": 1.61, "elapsed_time": "0:17:34", "remaining_time": "17:50:41", "throughput": 3347.7, "total_tokens": 3529984} +{"current_steps": 2905, "total_steps": 179580, "loss": 0.3096, "lr": 8.085532910123622e-06, "epoch": 0.32353268738166835, "percentage": 1.62, "elapsed_time": "0:17:36", "remaining_time": "17:50:40", "throughput": 3347.72, "total_tokens": 3536128} +{"current_steps": 2910, "total_steps": 179580, "loss": 0.4592, "lr": 8.099454282214056e-06, "epoch": 0.3240895422652857, "percentage": 1.62, "elapsed_time": "0:17:38", "remaining_time": "17:50:39", "throughput": 3347.68, "total_tokens": 3542208} +{"current_steps": 2915, "total_steps": 179580, "loss": 0.468, "lr": 8.113375654304489e-06, "epoch": 0.324646397148903, "percentage": 1.62, "elapsed_time": "0:17:39", "remaining_time": "17:50:34", "throughput": 3347.6, "total_tokens": 3548032} +{"current_steps": 2920, "total_steps": 179580, "loss": 0.1414, "lr": 8.127297026394922e-06, "epoch": 0.3252032520325203, "percentage": 1.63, "elapsed_time": "0:17:41", "remaining_time": "17:50:29", "throughput": 3347.59, "total_tokens": 3553952} +{"current_steps": 2925, "total_steps": 179580, "loss": 0.3593, "lr": 8.141218398485354e-06, "epoch": 0.32576010691613766, "percentage": 1.63, "elapsed_time": "0:17:43", "remaining_time": "17:50:29", "throughput": 3347.53, "total_tokens": 3560096} +{"current_steps": 2930, "total_steps": 179580, "loss": 0.3994, "lr": 8.155139770575789e-06, "epoch": 0.326316961799755, "percentage": 1.63, "elapsed_time": "0:17:45", "remaining_time": "17:50:20", "throughput": 3347.5, "total_tokens": 3565728} +{"current_steps": 2935, "total_steps": 179580, "loss": 0.5558, "lr": 8.169061142666221e-06, "epoch": 0.3268738166833723, "percentage": 1.63, "elapsed_time": "0:17:46", "remaining_time": "17:50:17", "throughput": 3347.48, "total_tokens": 3571712} +{"current_steps": 2940, "total_steps": 179580, "loss": 0.2708, "lr": 8.182982514756654e-06, "epoch": 0.32743067156698963, "percentage": 1.64, "elapsed_time": "0:17:48", "remaining_time": "17:50:19", "throughput": 3347.47, "total_tokens": 3578016} +{"current_steps": 2945, "total_steps": 179580, "loss": 0.249, "lr": 8.196903886847088e-06, "epoch": 0.32798752645060697, "percentage": 1.64, "elapsed_time": "0:17:50", "remaining_time": "17:50:16", "throughput": 3347.58, "total_tokens": 3584128} +{"current_steps": 2950, "total_steps": 179580, "loss": 0.1339, "lr": 8.21082525893752e-06, "epoch": 0.3285443813342243, "percentage": 1.64, "elapsed_time": "0:17:52", "remaining_time": "17:50:13", "throughput": 3347.6, "total_tokens": 3590208} +{"current_steps": 2955, "total_steps": 179580, "loss": 0.5016, "lr": 8.224746631027955e-06, "epoch": 0.32910123621784165, "percentage": 1.65, "elapsed_time": "0:17:54", "remaining_time": "17:50:12", "throughput": 3347.52, "total_tokens": 3596256} +{"current_steps": 2960, "total_steps": 179580, "loss": 0.2236, "lr": 8.238668003118388e-06, "epoch": 0.32965809110145894, "percentage": 1.65, "elapsed_time": "0:17:55", "remaining_time": "17:50:03", "throughput": 3347.46, "total_tokens": 3601824} +{"current_steps": 2965, "total_steps": 179580, "loss": 0.2805, "lr": 8.25258937520882e-06, "epoch": 0.3302149459850763, "percentage": 1.65, "elapsed_time": "0:17:57", "remaining_time": "17:49:57", "throughput": 3347.42, "total_tokens": 3607648} +{"current_steps": 2970, "total_steps": 179580, "loss": 0.3487, "lr": 8.266510747299255e-06, "epoch": 0.3307718008686936, "percentage": 1.65, "elapsed_time": "0:17:59", "remaining_time": "17:49:48", "throughput": 3347.46, "total_tokens": 3613408} +{"current_steps": 2975, "total_steps": 179580, "loss": 0.2066, "lr": 8.280432119389687e-06, "epoch": 0.33132865575231096, "percentage": 1.66, "elapsed_time": "0:18:01", "remaining_time": "17:49:47", "throughput": 3347.44, "total_tokens": 3619520} +{"current_steps": 2980, "total_steps": 179580, "loss": 0.2673, "lr": 8.294353491480122e-06, "epoch": 0.3318855106359283, "percentage": 1.66, "elapsed_time": "0:18:03", "remaining_time": "17:49:42", "throughput": 3347.45, "total_tokens": 3625408} +{"current_steps": 2985, "total_steps": 179580, "loss": 0.222, "lr": 8.308274863570554e-06, "epoch": 0.3324423655195456, "percentage": 1.66, "elapsed_time": "0:18:04", "remaining_time": "17:49:42", "throughput": 3347.5, "total_tokens": 3631648} +{"current_steps": 2990, "total_steps": 179580, "loss": 0.2399, "lr": 8.322196235660987e-06, "epoch": 0.33299922040316293, "percentage": 1.66, "elapsed_time": "0:18:06", "remaining_time": "17:49:41", "throughput": 3347.52, "total_tokens": 3637792} +{"current_steps": 2995, "total_steps": 179580, "loss": 0.3932, "lr": 8.33611760775142e-06, "epoch": 0.3335560752867803, "percentage": 1.67, "elapsed_time": "0:18:08", "remaining_time": "17:49:35", "throughput": 3347.45, "total_tokens": 3643584} +{"current_steps": 3000, "total_steps": 179580, "loss": 0.3213, "lr": 8.350038979841854e-06, "epoch": 0.3341129301703976, "percentage": 1.67, "elapsed_time": "0:18:10", "remaining_time": "17:49:33", "throughput": 3347.52, "total_tokens": 3649728} +{"current_steps": 3005, "total_steps": 179580, "loss": 0.1328, "lr": 8.363960351932287e-06, "epoch": 0.3346697850540149, "percentage": 1.67, "elapsed_time": "0:18:12", "remaining_time": "17:49:32", "throughput": 3347.5, "total_tokens": 3655840} +{"current_steps": 3010, "total_steps": 179580, "loss": 0.3751, "lr": 8.37788172402272e-06, "epoch": 0.33522663993763224, "percentage": 1.68, "elapsed_time": "0:18:14", "remaining_time": "17:49:36", "throughput": 3347.58, "total_tokens": 3662304} +{"current_steps": 3015, "total_steps": 179580, "loss": 0.1231, "lr": 8.391803096113154e-06, "epoch": 0.3357834948212496, "percentage": 1.68, "elapsed_time": "0:18:15", "remaining_time": "17:49:32", "throughput": 3347.5, "total_tokens": 3668192} +{"current_steps": 3020, "total_steps": 179580, "loss": 0.2123, "lr": 8.405724468203586e-06, "epoch": 0.3363403497048669, "percentage": 1.68, "elapsed_time": "0:18:17", "remaining_time": "17:49:31", "throughput": 3347.52, "total_tokens": 3674368} +{"current_steps": 3025, "total_steps": 179580, "loss": 0.4288, "lr": 8.41964584029402e-06, "epoch": 0.33689720458848427, "percentage": 1.68, "elapsed_time": "0:18:19", "remaining_time": "17:49:29", "throughput": 3347.45, "total_tokens": 3680352} +{"current_steps": 3030, "total_steps": 179580, "loss": 0.1718, "lr": 8.433567212384453e-06, "epoch": 0.33745405947210155, "percentage": 1.69, "elapsed_time": "0:18:21", "remaining_time": "17:49:27", "throughput": 3347.48, "total_tokens": 3686464} +{"current_steps": 3035, "total_steps": 179580, "loss": 0.3923, "lr": 8.447488584474886e-06, "epoch": 0.3380109143557189, "percentage": 1.69, "elapsed_time": "0:18:23", "remaining_time": "17:49:27", "throughput": 3347.49, "total_tokens": 3692640} +{"current_steps": 3040, "total_steps": 179580, "loss": 0.4503, "lr": 8.46140995656532e-06, "epoch": 0.33856776923933624, "percentage": 1.69, "elapsed_time": "0:18:24", "remaining_time": "17:49:16", "throughput": 3347.37, "total_tokens": 3698048} +{"current_steps": 3045, "total_steps": 179580, "loss": 0.1652, "lr": 8.475331328655753e-06, "epoch": 0.3391246241229536, "percentage": 1.7, "elapsed_time": "0:18:26", "remaining_time": "17:49:13", "throughput": 3347.4, "total_tokens": 3704128} +{"current_steps": 3050, "total_steps": 179580, "loss": 0.3817, "lr": 8.489252700746187e-06, "epoch": 0.33968147900657086, "percentage": 1.7, "elapsed_time": "0:18:28", "remaining_time": "17:49:18", "throughput": 3347.47, "total_tokens": 3710688} +{"current_steps": 3055, "total_steps": 179580, "loss": 0.4675, "lr": 8.503174072836618e-06, "epoch": 0.3402383338901882, "percentage": 1.7, "elapsed_time": "0:18:30", "remaining_time": "17:49:16", "throughput": 3347.47, "total_tokens": 3716736} +{"current_steps": 3060, "total_steps": 179580, "loss": 0.3691, "lr": 8.517095444927052e-06, "epoch": 0.34079518877380555, "percentage": 1.7, "elapsed_time": "0:18:32", "remaining_time": "17:49:10", "throughput": 3347.4, "total_tokens": 3722496} +{"current_steps": 3065, "total_steps": 179580, "loss": 0.298, "lr": 8.531016817017485e-06, "epoch": 0.3413520436574229, "percentage": 1.71, "elapsed_time": "0:18:33", "remaining_time": "17:49:09", "throughput": 3347.38, "total_tokens": 3728608} +{"current_steps": 3070, "total_steps": 179580, "loss": 0.1788, "lr": 8.54493818910792e-06, "epoch": 0.34190889854104023, "percentage": 1.71, "elapsed_time": "0:18:35", "remaining_time": "17:49:07", "throughput": 3347.4, "total_tokens": 3734688} +{"current_steps": 3075, "total_steps": 179580, "loss": 0.2933, "lr": 8.558859561198352e-06, "epoch": 0.3424657534246575, "percentage": 1.71, "elapsed_time": "0:18:37", "remaining_time": "17:49:10", "throughput": 3347.41, "total_tokens": 3741056} +{"current_steps": 3080, "total_steps": 179580, "loss": 0.1969, "lr": 8.572780933288785e-06, "epoch": 0.34302260830827486, "percentage": 1.72, "elapsed_time": "0:18:39", "remaining_time": "17:49:10", "throughput": 3347.33, "total_tokens": 3747168} +{"current_steps": 3085, "total_steps": 179580, "loss": 0.2419, "lr": 8.586702305379219e-06, "epoch": 0.3435794631918922, "percentage": 1.72, "elapsed_time": "0:18:41", "remaining_time": "17:49:11", "throughput": 3347.34, "total_tokens": 3753440} +{"current_steps": 3090, "total_steps": 179580, "loss": 0.193, "lr": 8.600623677469651e-06, "epoch": 0.34413631807550954, "percentage": 1.72, "elapsed_time": "0:18:43", "remaining_time": "17:49:11", "throughput": 3347.28, "total_tokens": 3759584} +{"current_steps": 3095, "total_steps": 179580, "loss": 0.1318, "lr": 8.614545049560086e-06, "epoch": 0.3446931729591268, "percentage": 1.72, "elapsed_time": "0:18:45", "remaining_time": "17:49:13", "throughput": 3347.29, "total_tokens": 3765856} +{"current_steps": 3100, "total_steps": 179580, "loss": 0.451, "lr": 8.628466421650517e-06, "epoch": 0.34525002784274417, "percentage": 1.73, "elapsed_time": "0:18:46", "remaining_time": "17:49:14", "throughput": 3347.37, "total_tokens": 3772224} +{"current_steps": 3105, "total_steps": 179580, "loss": 0.3598, "lr": 8.642387793740951e-06, "epoch": 0.3458068827263615, "percentage": 1.73, "elapsed_time": "0:18:48", "remaining_time": "17:49:15", "throughput": 3347.31, "total_tokens": 3778400} +{"current_steps": 3110, "total_steps": 179580, "loss": 0.1356, "lr": 8.656309165831385e-06, "epoch": 0.34636373760997885, "percentage": 1.73, "elapsed_time": "0:18:50", "remaining_time": "17:49:16", "throughput": 3347.29, "total_tokens": 3784608} +{"current_steps": 3115, "total_steps": 179580, "loss": 0.1591, "lr": 8.670230537921818e-06, "epoch": 0.3469205924935962, "percentage": 1.73, "elapsed_time": "0:18:52", "remaining_time": "17:49:13", "throughput": 3347.3, "total_tokens": 3790688} +{"current_steps": 3120, "total_steps": 179580, "loss": 0.2666, "lr": 8.684151910012252e-06, "epoch": 0.3474774473772135, "percentage": 1.74, "elapsed_time": "0:18:54", "remaining_time": "17:49:13", "throughput": 3347.31, "total_tokens": 3796864} +{"current_steps": 3125, "total_steps": 179580, "loss": 0.343, "lr": 8.698073282102683e-06, "epoch": 0.3480343022608308, "percentage": 1.74, "elapsed_time": "0:18:56", "remaining_time": "17:49:13", "throughput": 3347.3, "total_tokens": 3803008} +{"current_steps": 3130, "total_steps": 179580, "loss": 0.2344, "lr": 8.711994654193118e-06, "epoch": 0.34859115714444816, "percentage": 1.74, "elapsed_time": "0:18:57", "remaining_time": "17:49:11", "throughput": 3347.31, "total_tokens": 3809152} +{"current_steps": 3135, "total_steps": 179580, "loss": 0.2363, "lr": 8.72591602628355e-06, "epoch": 0.3491480120280655, "percentage": 1.75, "elapsed_time": "0:18:59", "remaining_time": "17:49:10", "throughput": 3347.33, "total_tokens": 3815296} +{"current_steps": 3140, "total_steps": 179580, "loss": 0.1991, "lr": 8.739837398373985e-06, "epoch": 0.3497048669116828, "percentage": 1.75, "elapsed_time": "0:19:01", "remaining_time": "17:49:08", "throughput": 3347.31, "total_tokens": 3821312} +{"current_steps": 3145, "total_steps": 179580, "loss": 0.1545, "lr": 8.753758770464417e-06, "epoch": 0.35026172179530013, "percentage": 1.75, "elapsed_time": "0:19:03", "remaining_time": "17:49:05", "throughput": 3347.29, "total_tokens": 3827328} +{"current_steps": 3150, "total_steps": 179580, "loss": 0.2242, "lr": 8.76768014255485e-06, "epoch": 0.35081857667891747, "percentage": 1.75, "elapsed_time": "0:19:05", "remaining_time": "17:49:02", "throughput": 3347.25, "total_tokens": 3833312} +{"current_steps": 3155, "total_steps": 179580, "loss": 0.2047, "lr": 8.781601514645284e-06, "epoch": 0.3513754315625348, "percentage": 1.76, "elapsed_time": "0:19:07", "remaining_time": "17:49:01", "throughput": 3347.3, "total_tokens": 3839456} +{"current_steps": 3160, "total_steps": 179580, "loss": 0.1833, "lr": 8.795522886735717e-06, "epoch": 0.35193228644615215, "percentage": 1.76, "elapsed_time": "0:19:08", "remaining_time": "17:49:00", "throughput": 3347.27, "total_tokens": 3845568} +{"current_steps": 3165, "total_steps": 179580, "loss": 0.2448, "lr": 8.809444258826151e-06, "epoch": 0.35248914132976944, "percentage": 1.76, "elapsed_time": "0:19:10", "remaining_time": "17:48:58", "throughput": 3347.29, "total_tokens": 3851680} +{"current_steps": 3170, "total_steps": 179580, "loss": 0.255, "lr": 8.823365630916584e-06, "epoch": 0.3530459962133868, "percentage": 1.77, "elapsed_time": "0:19:12", "remaining_time": "17:49:00", "throughput": 3347.42, "total_tokens": 3858144} +{"current_steps": 3175, "total_steps": 179580, "loss": 0.2324, "lr": 8.837287003007016e-06, "epoch": 0.3536028510970041, "percentage": 1.77, "elapsed_time": "0:19:14", "remaining_time": "17:48:56", "throughput": 3347.43, "total_tokens": 3864128} +{"current_steps": 3180, "total_steps": 179580, "loss": 0.5013, "lr": 8.85120837509745e-06, "epoch": 0.35415970598062146, "percentage": 1.77, "elapsed_time": "0:19:16", "remaining_time": "17:48:59", "throughput": 3347.47, "total_tokens": 3870528} +{"current_steps": 3185, "total_steps": 179580, "loss": 0.1702, "lr": 8.865129747187883e-06, "epoch": 0.3547165608642388, "percentage": 1.77, "elapsed_time": "0:19:18", "remaining_time": "17:48:58", "throughput": 3347.45, "total_tokens": 3876640} +{"current_steps": 3190, "total_steps": 179580, "loss": 0.3162, "lr": 8.879051119278318e-06, "epoch": 0.3552734157478561, "percentage": 1.78, "elapsed_time": "0:19:19", "remaining_time": "17:48:55", "throughput": 3347.44, "total_tokens": 3882656} +{"current_steps": 3195, "total_steps": 179580, "loss": 0.2349, "lr": 8.892972491368749e-06, "epoch": 0.35583027063147343, "percentage": 1.78, "elapsed_time": "0:19:21", "remaining_time": "17:48:51", "throughput": 3347.37, "total_tokens": 3888544} +{"current_steps": 3200, "total_steps": 179580, "loss": 0.4129, "lr": 8.906893863459183e-06, "epoch": 0.3563871255150908, "percentage": 1.78, "elapsed_time": "0:19:23", "remaining_time": "17:48:51", "throughput": 3347.39, "total_tokens": 3894720} +{"current_steps": 3205, "total_steps": 179580, "loss": 0.222, "lr": 8.920815235549616e-06, "epoch": 0.3569439803987081, "percentage": 1.78, "elapsed_time": "0:19:25", "remaining_time": "17:48:51", "throughput": 3347.38, "total_tokens": 3900928} +{"current_steps": 3210, "total_steps": 179580, "loss": 0.2121, "lr": 8.93473660764005e-06, "epoch": 0.3575008352823254, "percentage": 1.79, "elapsed_time": "0:19:27", "remaining_time": "17:48:49", "throughput": 3347.41, "total_tokens": 3907008} +{"current_steps": 3215, "total_steps": 179580, "loss": 0.0736, "lr": 8.948657979730483e-06, "epoch": 0.35805769016594274, "percentage": 1.79, "elapsed_time": "0:19:28", "remaining_time": "17:48:44", "throughput": 3347.41, "total_tokens": 3912896} +{"current_steps": 3220, "total_steps": 179580, "loss": 0.3034, "lr": 8.962579351820915e-06, "epoch": 0.3586145450495601, "percentage": 1.79, "elapsed_time": "0:19:30", "remaining_time": "17:48:41", "throughput": 3347.35, "total_tokens": 3918848} +{"current_steps": 3225, "total_steps": 179580, "loss": 0.1483, "lr": 8.97650072391135e-06, "epoch": 0.3591713999331774, "percentage": 1.8, "elapsed_time": "0:19:32", "remaining_time": "17:48:37", "throughput": 3347.36, "total_tokens": 3924832} +{"current_steps": 3230, "total_steps": 179580, "loss": 0.1182, "lr": 8.990422096001782e-06, "epoch": 0.35972825481679477, "percentage": 1.8, "elapsed_time": "0:19:34", "remaining_time": "17:48:40", "throughput": 3347.4, "total_tokens": 3931232} +{"current_steps": 3235, "total_steps": 179580, "loss": 0.3291, "lr": 9.004343468092217e-06, "epoch": 0.36028510970041205, "percentage": 1.8, "elapsed_time": "0:19:36", "remaining_time": "17:48:39", "throughput": 3347.45, "total_tokens": 3937472} +{"current_steps": 3240, "total_steps": 179580, "loss": 0.3421, "lr": 9.01826484018265e-06, "epoch": 0.3608419645840294, "percentage": 1.8, "elapsed_time": "0:19:38", "remaining_time": "17:48:38", "throughput": 3347.41, "total_tokens": 3943552} +{"current_steps": 3245, "total_steps": 179580, "loss": 0.1619, "lr": 9.032186212273082e-06, "epoch": 0.36139881946764674, "percentage": 1.81, "elapsed_time": "0:19:39", "remaining_time": "17:48:38", "throughput": 3347.43, "total_tokens": 3949760} +{"current_steps": 3250, "total_steps": 179580, "loss": 0.2848, "lr": 9.046107584363516e-06, "epoch": 0.3619556743512641, "percentage": 1.81, "elapsed_time": "0:19:41", "remaining_time": "17:48:43", "throughput": 3347.46, "total_tokens": 3956320} +{"current_steps": 3255, "total_steps": 179580, "loss": 0.4252, "lr": 9.060028956453949e-06, "epoch": 0.36251252923488136, "percentage": 1.81, "elapsed_time": "0:19:43", "remaining_time": "17:48:42", "throughput": 3347.43, "total_tokens": 3962400} +{"current_steps": 3260, "total_steps": 179580, "loss": 0.206, "lr": 9.073950328544381e-06, "epoch": 0.3630693841184987, "percentage": 1.82, "elapsed_time": "0:19:45", "remaining_time": "17:48:39", "throughput": 3347.43, "total_tokens": 3968448} +{"current_steps": 3265, "total_steps": 179580, "loss": 0.1139, "lr": 9.087871700634814e-06, "epoch": 0.36362623900211605, "percentage": 1.82, "elapsed_time": "0:19:47", "remaining_time": "17:48:39", "throughput": 3347.5, "total_tokens": 3974720} +{"current_steps": 3270, "total_steps": 179580, "loss": 0.2482, "lr": 9.101793072725248e-06, "epoch": 0.3641830938857334, "percentage": 1.82, "elapsed_time": "0:19:49", "remaining_time": "17:48:35", "throughput": 3347.43, "total_tokens": 3980576} +{"current_steps": 3275, "total_steps": 179580, "loss": 0.1673, "lr": 9.115714444815681e-06, "epoch": 0.36473994876935073, "percentage": 1.82, "elapsed_time": "0:19:50", "remaining_time": "17:48:26", "throughput": 3347.49, "total_tokens": 3986272} +{"current_steps": 3280, "total_steps": 179580, "loss": 0.2197, "lr": 9.129635816906115e-06, "epoch": 0.365296803652968, "percentage": 1.83, "elapsed_time": "0:19:52", "remaining_time": "17:48:25", "throughput": 3347.52, "total_tokens": 3992480} +{"current_steps": 3285, "total_steps": 179580, "loss": 0.2888, "lr": 9.143557188996548e-06, "epoch": 0.36585365853658536, "percentage": 1.83, "elapsed_time": "0:19:54", "remaining_time": "17:48:19", "throughput": 3347.49, "total_tokens": 3998240} +{"current_steps": 3290, "total_steps": 179580, "loss": 0.2409, "lr": 9.15747856108698e-06, "epoch": 0.3664105134202027, "percentage": 1.83, "elapsed_time": "0:19:56", "remaining_time": "17:48:15", "throughput": 3347.49, "total_tokens": 4004160} +{"current_steps": 3295, "total_steps": 179580, "loss": 0.2156, "lr": 9.171399933177415e-06, "epoch": 0.36696736830382004, "percentage": 1.83, "elapsed_time": "0:19:57", "remaining_time": "17:48:08", "throughput": 3347.45, "total_tokens": 4009920} +{"current_steps": 3300, "total_steps": 179580, "loss": 0.5073, "lr": 9.185321305267848e-06, "epoch": 0.3675242231874373, "percentage": 1.84, "elapsed_time": "0:19:59", "remaining_time": "17:47:59", "throughput": 3347.28, "total_tokens": 4015328} +{"current_steps": 3305, "total_steps": 179580, "loss": 0.2822, "lr": 9.199242677358282e-06, "epoch": 0.36808107807105467, "percentage": 1.84, "elapsed_time": "0:20:01", "remaining_time": "17:47:56", "throughput": 3347.21, "total_tokens": 4021280} +{"current_steps": 3310, "total_steps": 179580, "loss": 0.3274, "lr": 9.213164049448715e-06, "epoch": 0.368637932954672, "percentage": 1.84, "elapsed_time": "0:20:03", "remaining_time": "17:47:54", "throughput": 3347.24, "total_tokens": 4027392} +{"current_steps": 3315, "total_steps": 179580, "loss": 0.2438, "lr": 9.227085421539147e-06, "epoch": 0.36919478783828935, "percentage": 1.85, "elapsed_time": "0:20:05", "remaining_time": "17:47:55", "throughput": 3347.27, "total_tokens": 4033664} +{"current_steps": 3320, "total_steps": 179580, "loss": 0.5064, "lr": 9.241006793629581e-06, "epoch": 0.3697516427219067, "percentage": 1.85, "elapsed_time": "0:20:06", "remaining_time": "17:47:50", "throughput": 3347.18, "total_tokens": 4039424} +{"current_steps": 3325, "total_steps": 179580, "loss": 0.2136, "lr": 9.254928165720014e-06, "epoch": 0.370308497605524, "percentage": 1.85, "elapsed_time": "0:20:08", "remaining_time": "17:47:48", "throughput": 3347.26, "total_tokens": 4045600} +{"current_steps": 3330, "total_steps": 179580, "loss": 0.2004, "lr": 9.268849537810447e-06, "epoch": 0.3708653524891413, "percentage": 1.85, "elapsed_time": "0:20:10", "remaining_time": "17:47:43", "throughput": 3347.22, "total_tokens": 4051456} +{"current_steps": 3335, "total_steps": 179580, "loss": 0.2892, "lr": 9.28277090990088e-06, "epoch": 0.37142220737275866, "percentage": 1.86, "elapsed_time": "0:20:12", "remaining_time": "17:47:42", "throughput": 3347.31, "total_tokens": 4057664} +{"current_steps": 3340, "total_steps": 179580, "loss": 0.2791, "lr": 9.296692281991314e-06, "epoch": 0.371979062256376, "percentage": 1.86, "elapsed_time": "0:20:14", "remaining_time": "17:47:41", "throughput": 3347.39, "total_tokens": 4063936} +{"current_steps": 3345, "total_steps": 179580, "loss": 0.3732, "lr": 9.310613654081746e-06, "epoch": 0.37253591713999334, "percentage": 1.86, "elapsed_time": "0:20:15", "remaining_time": "17:47:39", "throughput": 3347.47, "total_tokens": 4070112} +{"current_steps": 3350, "total_steps": 179580, "loss": 0.2903, "lr": 9.32453502617218e-06, "epoch": 0.37309277202361063, "percentage": 1.87, "elapsed_time": "0:20:17", "remaining_time": "17:47:39", "throughput": 3347.52, "total_tokens": 4076320} +{"current_steps": 3355, "total_steps": 179580, "loss": 0.2686, "lr": 9.338456398262613e-06, "epoch": 0.37364962690722797, "percentage": 1.87, "elapsed_time": "0:20:19", "remaining_time": "17:47:37", "throughput": 3347.51, "total_tokens": 4082432} +{"current_steps": 3360, "total_steps": 179580, "loss": 0.3095, "lr": 9.352377770353046e-06, "epoch": 0.3742064817908453, "percentage": 1.87, "elapsed_time": "0:20:21", "remaining_time": "17:47:31", "throughput": 3347.51, "total_tokens": 4088224} +{"current_steps": 3365, "total_steps": 179580, "loss": 0.3495, "lr": 9.36629914244348e-06, "epoch": 0.37476333667446265, "percentage": 1.87, "elapsed_time": "0:20:23", "remaining_time": "17:47:27", "throughput": 3347.53, "total_tokens": 4094208} +{"current_steps": 3370, "total_steps": 179580, "loss": 0.273, "lr": 9.380220514533913e-06, "epoch": 0.37532019155807994, "percentage": 1.88, "elapsed_time": "0:20:24", "remaining_time": "17:47:30", "throughput": 3347.63, "total_tokens": 4100736} +{"current_steps": 3375, "total_steps": 179580, "loss": 0.3134, "lr": 9.394141886624346e-06, "epoch": 0.3758770464416973, "percentage": 1.88, "elapsed_time": "0:20:26", "remaining_time": "17:47:32", "throughput": 3347.63, "total_tokens": 4107072} +{"current_steps": 3380, "total_steps": 179580, "loss": 0.28, "lr": 9.40806325871478e-06, "epoch": 0.3764339013253146, "percentage": 1.88, "elapsed_time": "0:20:28", "remaining_time": "17:47:31", "throughput": 3347.61, "total_tokens": 4113184} +{"current_steps": 3385, "total_steps": 179580, "loss": 0.2292, "lr": 9.421984630805212e-06, "epoch": 0.37699075620893197, "percentage": 1.88, "elapsed_time": "0:20:30", "remaining_time": "17:47:32", "throughput": 3347.69, "total_tokens": 4119488} +{"current_steps": 3390, "total_steps": 179580, "loss": 0.3668, "lr": 9.435906002895647e-06, "epoch": 0.3775476110925493, "percentage": 1.89, "elapsed_time": "0:20:32", "remaining_time": "17:47:32", "throughput": 3347.71, "total_tokens": 4125760} +{"current_steps": 3395, "total_steps": 179580, "loss": 0.2175, "lr": 9.44982737498608e-06, "epoch": 0.3781044659761666, "percentage": 1.89, "elapsed_time": "0:20:34", "remaining_time": "17:47:33", "throughput": 3347.74, "total_tokens": 4132064} +{"current_steps": 3400, "total_steps": 179580, "loss": 0.2412, "lr": 9.463748747076512e-06, "epoch": 0.37866132085978393, "percentage": 1.89, "elapsed_time": "0:20:35", "remaining_time": "17:47:21", "throughput": 3347.72, "total_tokens": 4137440} +{"current_steps": 3405, "total_steps": 179580, "loss": 0.1771, "lr": 9.477670119166945e-06, "epoch": 0.3792181757434013, "percentage": 1.9, "elapsed_time": "0:20:37", "remaining_time": "17:47:17", "throughput": 3347.73, "total_tokens": 4143392} +{"current_steps": 3410, "total_steps": 179580, "loss": 0.1547, "lr": 9.491591491257379e-06, "epoch": 0.3797750306270186, "percentage": 1.9, "elapsed_time": "0:20:39", "remaining_time": "17:47:15", "throughput": 3347.84, "total_tokens": 4149632} +{"current_steps": 3415, "total_steps": 179580, "loss": 0.3364, "lr": 9.505512863347812e-06, "epoch": 0.3803318855106359, "percentage": 1.9, "elapsed_time": "0:20:41", "remaining_time": "17:47:19", "throughput": 3347.85, "total_tokens": 4156096} +{"current_steps": 3420, "total_steps": 179580, "loss": 0.207, "lr": 9.519434235438244e-06, "epoch": 0.38088874039425324, "percentage": 1.9, "elapsed_time": "0:20:43", "remaining_time": "17:47:19", "throughput": 3347.87, "total_tokens": 4162336} +{"current_steps": 3425, "total_steps": 179580, "loss": 0.4118, "lr": 9.533355607528679e-06, "epoch": 0.3814455952778706, "percentage": 1.91, "elapsed_time": "0:20:45", "remaining_time": "17:47:20", "throughput": 3347.86, "total_tokens": 4168544} +{"current_steps": 3430, "total_steps": 179580, "loss": 0.2629, "lr": 9.547276979619111e-06, "epoch": 0.3820024501614879, "percentage": 1.91, "elapsed_time": "0:20:46", "remaining_time": "17:47:20", "throughput": 3347.84, "total_tokens": 4174752} +{"current_steps": 3435, "total_steps": 179580, "loss": 0.2597, "lr": 9.561198351709546e-06, "epoch": 0.38255930504510527, "percentage": 1.91, "elapsed_time": "0:20:48", "remaining_time": "17:47:14", "throughput": 3347.83, "total_tokens": 4180576} +{"current_steps": 3440, "total_steps": 179580, "loss": 0.2889, "lr": 9.575119723799978e-06, "epoch": 0.38311615992872255, "percentage": 1.92, "elapsed_time": "0:20:50", "remaining_time": "17:47:13", "throughput": 3347.81, "total_tokens": 4186688} +{"current_steps": 3445, "total_steps": 179580, "loss": 0.1541, "lr": 9.589041095890411e-06, "epoch": 0.3836730148123399, "percentage": 1.92, "elapsed_time": "0:20:52", "remaining_time": "17:47:05", "throughput": 3347.76, "total_tokens": 4192320} +{"current_steps": 3450, "total_steps": 179580, "loss": 0.3386, "lr": 9.602962467980845e-06, "epoch": 0.38422986969595724, "percentage": 1.92, "elapsed_time": "0:20:54", "remaining_time": "17:47:03", "throughput": 3347.81, "total_tokens": 4198432} +{"current_steps": 3455, "total_steps": 179580, "loss": 0.2001, "lr": 9.616883840071278e-06, "epoch": 0.3847867245795746, "percentage": 1.92, "elapsed_time": "0:20:55", "remaining_time": "17:47:05", "throughput": 3347.79, "total_tokens": 4204736} +{"current_steps": 3460, "total_steps": 179580, "loss": 0.1673, "lr": 9.630805212161712e-06, "epoch": 0.38534357946319187, "percentage": 1.93, "elapsed_time": "0:20:57", "remaining_time": "17:47:01", "throughput": 3347.75, "total_tokens": 4210624} +{"current_steps": 3465, "total_steps": 179580, "loss": 0.4365, "lr": 9.644726584252145e-06, "epoch": 0.3859004343468092, "percentage": 1.93, "elapsed_time": "0:20:59", "remaining_time": "17:46:55", "throughput": 3347.69, "total_tokens": 4216352} +{"current_steps": 3470, "total_steps": 179580, "loss": 0.4055, "lr": 9.658647956342577e-06, "epoch": 0.38645728923042655, "percentage": 1.93, "elapsed_time": "0:21:01", "remaining_time": "17:46:54", "throughput": 3347.67, "total_tokens": 4222464} +{"current_steps": 3475, "total_steps": 179580, "loss": 0.3179, "lr": 9.67256932843301e-06, "epoch": 0.3870141441140439, "percentage": 1.94, "elapsed_time": "0:21:03", "remaining_time": "17:46:54", "throughput": 3347.75, "total_tokens": 4228768} +{"current_steps": 3480, "total_steps": 179580, "loss": 0.3242, "lr": 9.686490700523444e-06, "epoch": 0.38757099899766123, "percentage": 1.94, "elapsed_time": "0:21:05", "remaining_time": "17:46:55", "throughput": 3347.77, "total_tokens": 4235040} +{"current_steps": 3485, "total_steps": 179580, "loss": 0.3308, "lr": 9.700412072613877e-06, "epoch": 0.3881278538812785, "percentage": 1.94, "elapsed_time": "0:21:06", "remaining_time": "17:46:55", "throughput": 3347.79, "total_tokens": 4241312} +{"current_steps": 3490, "total_steps": 179580, "loss": 0.2245, "lr": 9.71433344470431e-06, "epoch": 0.38868470876489586, "percentage": 1.94, "elapsed_time": "0:21:08", "remaining_time": "17:46:57", "throughput": 3347.8, "total_tokens": 4247648} +{"current_steps": 3495, "total_steps": 179580, "loss": 0.4676, "lr": 9.728254816794744e-06, "epoch": 0.3892415636485132, "percentage": 1.95, "elapsed_time": "0:21:10", "remaining_time": "17:46:53", "throughput": 3347.84, "total_tokens": 4253664} +{"current_steps": 3500, "total_steps": 179580, "loss": 0.4109, "lr": 9.742176188885177e-06, "epoch": 0.38979841853213054, "percentage": 1.95, "elapsed_time": "0:21:12", "remaining_time": "17:46:54", "throughput": 3347.8, "total_tokens": 4259840} +{"current_steps": 3505, "total_steps": 179580, "loss": 0.2555, "lr": 9.756097560975611e-06, "epoch": 0.3903552734157479, "percentage": 1.95, "elapsed_time": "0:21:14", "remaining_time": "17:46:49", "throughput": 3347.75, "total_tokens": 4265696} +{"current_steps": 3510, "total_steps": 179580, "loss": 0.2892, "lr": 9.770018933066044e-06, "epoch": 0.39091212829936517, "percentage": 1.95, "elapsed_time": "0:21:15", "remaining_time": "17:46:44", "throughput": 3347.74, "total_tokens": 4271520} +{"current_steps": 3515, "total_steps": 179580, "loss": 0.3615, "lr": 9.783940305156476e-06, "epoch": 0.3914689831829825, "percentage": 1.96, "elapsed_time": "0:21:17", "remaining_time": "17:46:44", "throughput": 3347.76, "total_tokens": 4277792} +{"current_steps": 3520, "total_steps": 179580, "loss": 0.1515, "lr": 9.79786167724691e-06, "epoch": 0.39202583806659985, "percentage": 1.96, "elapsed_time": "0:21:19", "remaining_time": "17:46:45", "throughput": 3347.87, "total_tokens": 4284160} +{"current_steps": 3525, "total_steps": 179580, "loss": 0.3245, "lr": 9.811783049337343e-06, "epoch": 0.3925826929502172, "percentage": 1.96, "elapsed_time": "0:21:21", "remaining_time": "17:46:39", "throughput": 3347.85, "total_tokens": 4289952} +{"current_steps": 3530, "total_steps": 179580, "loss": 0.2043, "lr": 9.825704421427778e-06, "epoch": 0.3931395478338345, "percentage": 1.97, "elapsed_time": "0:21:23", "remaining_time": "17:46:38", "throughput": 3347.88, "total_tokens": 4296160} +{"current_steps": 3535, "total_steps": 179580, "loss": 0.232, "lr": 9.839625793518208e-06, "epoch": 0.3936964027174518, "percentage": 1.97, "elapsed_time": "0:21:25", "remaining_time": "17:46:36", "throughput": 3347.9, "total_tokens": 4302240} +{"current_steps": 3540, "total_steps": 179580, "loss": 0.3132, "lr": 9.853547165608643e-06, "epoch": 0.39425325760106916, "percentage": 1.97, "elapsed_time": "0:21:26", "remaining_time": "17:46:37", "throughput": 3347.93, "total_tokens": 4308544} +{"current_steps": 3545, "total_steps": 179580, "loss": 0.3235, "lr": 9.867468537699075e-06, "epoch": 0.3948101124846865, "percentage": 1.97, "elapsed_time": "0:21:28", "remaining_time": "17:46:35", "throughput": 3347.94, "total_tokens": 4314624} +{"current_steps": 3550, "total_steps": 179580, "loss": 0.2028, "lr": 9.88138990978951e-06, "epoch": 0.39536696736830385, "percentage": 1.98, "elapsed_time": "0:21:30", "remaining_time": "17:46:33", "throughput": 3347.95, "total_tokens": 4320704} +{"current_steps": 3555, "total_steps": 179580, "loss": 0.2806, "lr": 9.895311281879942e-06, "epoch": 0.39592382225192113, "percentage": 1.98, "elapsed_time": "0:21:32", "remaining_time": "17:46:31", "throughput": 3347.94, "total_tokens": 4326752} +{"current_steps": 3560, "total_steps": 179580, "loss": 0.3294, "lr": 9.909232653970375e-06, "epoch": 0.3964806771355385, "percentage": 1.98, "elapsed_time": "0:21:34", "remaining_time": "17:46:34", "throughput": 3347.97, "total_tokens": 4333248} +{"current_steps": 3565, "total_steps": 179580, "loss": 0.3784, "lr": 9.92315402606081e-06, "epoch": 0.3970375320191558, "percentage": 1.99, "elapsed_time": "0:21:36", "remaining_time": "17:46:32", "throughput": 3348.0, "total_tokens": 4339360} +{"current_steps": 3570, "total_steps": 179580, "loss": 0.2632, "lr": 9.937075398151242e-06, "epoch": 0.39759438690277316, "percentage": 1.99, "elapsed_time": "0:21:37", "remaining_time": "17:46:32", "throughput": 3348.02, "total_tokens": 4345568} +{"current_steps": 3575, "total_steps": 179580, "loss": 0.2886, "lr": 9.950996770241676e-06, "epoch": 0.39815124178639044, "percentage": 1.99, "elapsed_time": "0:21:39", "remaining_time": "17:46:31", "throughput": 3348.09, "total_tokens": 4351840} +{"current_steps": 3580, "total_steps": 179580, "loss": 0.3477, "lr": 9.964918142332107e-06, "epoch": 0.3987080966700078, "percentage": 1.99, "elapsed_time": "0:21:41", "remaining_time": "17:46:29", "throughput": 3348.02, "total_tokens": 4357824} +{"current_steps": 3585, "total_steps": 179580, "loss": 0.2821, "lr": 9.978839514422542e-06, "epoch": 0.3992649515536251, "percentage": 2.0, "elapsed_time": "0:21:43", "remaining_time": "17:46:29", "throughput": 3348.02, "total_tokens": 4364000} +{"current_steps": 3590, "total_steps": 179580, "loss": 0.367, "lr": 9.992760886512976e-06, "epoch": 0.39982180643724247, "percentage": 2.0, "elapsed_time": "0:21:45", "remaining_time": "17:46:28", "throughput": 3348.09, "total_tokens": 4370272} +{"current_steps": 3595, "total_steps": 179580, "loss": 0.2392, "lr": 1.0006682258603409e-05, "epoch": 0.4003786613208598, "percentage": 2.0, "elapsed_time": "0:21:46", "remaining_time": "17:46:20", "throughput": 3348.06, "total_tokens": 4375840} +{"current_steps": 3600, "total_steps": 179580, "loss": 0.2406, "lr": 1.0020603630693843e-05, "epoch": 0.4009355162044771, "percentage": 2.0, "elapsed_time": "0:21:48", "remaining_time": "17:46:24", "throughput": 3348.1, "total_tokens": 4382432} +{"current_steps": 3605, "total_steps": 179580, "loss": 0.1032, "lr": 1.0034525002784274e-05, "epoch": 0.40149237108809444, "percentage": 2.01, "elapsed_time": "0:21:50", "remaining_time": "17:46:22", "throughput": 3348.12, "total_tokens": 4388512} +{"current_steps": 3610, "total_steps": 179580, "loss": 0.3647, "lr": 1.0048446374874708e-05, "epoch": 0.4020492259717118, "percentage": 2.01, "elapsed_time": "0:21:52", "remaining_time": "17:46:15", "throughput": 3348.07, "total_tokens": 4394144} +{"current_steps": 3615, "total_steps": 179580, "loss": 0.2033, "lr": 1.006236774696514e-05, "epoch": 0.4026060808553291, "percentage": 2.01, "elapsed_time": "0:21:54", "remaining_time": "17:46:08", "throughput": 3347.98, "total_tokens": 4399776} +{"current_steps": 3620, "total_steps": 179580, "loss": 0.1539, "lr": 1.0076289119055575e-05, "epoch": 0.4031629357389464, "percentage": 2.02, "elapsed_time": "0:21:55", "remaining_time": "17:46:02", "throughput": 3347.9, "total_tokens": 4405472} +{"current_steps": 3625, "total_steps": 179580, "loss": 0.2648, "lr": 1.0090210491146008e-05, "epoch": 0.40371979062256375, "percentage": 2.02, "elapsed_time": "0:21:57", "remaining_time": "17:46:05", "throughput": 3347.92, "total_tokens": 4411936} +{"current_steps": 3630, "total_steps": 179580, "loss": 0.3254, "lr": 1.010413186323644e-05, "epoch": 0.4042766455061811, "percentage": 2.02, "elapsed_time": "0:21:59", "remaining_time": "17:46:07", "throughput": 3347.94, "total_tokens": 4418304} +{"current_steps": 3635, "total_steps": 179580, "loss": 0.1429, "lr": 1.0118053235326875e-05, "epoch": 0.40483350038979843, "percentage": 2.02, "elapsed_time": "0:22:01", "remaining_time": "17:46:05", "throughput": 3347.93, "total_tokens": 4424320} +{"current_steps": 3640, "total_steps": 179580, "loss": 0.4855, "lr": 1.0131974607417307e-05, "epoch": 0.40539035527341577, "percentage": 2.03, "elapsed_time": "0:22:03", "remaining_time": "17:46:08", "throughput": 3347.94, "total_tokens": 4430752} +{"current_steps": 3645, "total_steps": 179580, "loss": 0.2047, "lr": 1.0145895979507742e-05, "epoch": 0.40594721015703306, "percentage": 2.03, "elapsed_time": "0:22:05", "remaining_time": "17:46:10", "throughput": 3347.93, "total_tokens": 4437088} +{"current_steps": 3650, "total_steps": 179580, "loss": 0.1724, "lr": 1.0159817351598173e-05, "epoch": 0.4065040650406504, "percentage": 2.03, "elapsed_time": "0:22:07", "remaining_time": "17:46:06", "throughput": 3347.89, "total_tokens": 4442976} +{"current_steps": 3655, "total_steps": 179580, "loss": 0.2123, "lr": 1.0173738723688607e-05, "epoch": 0.40706091992426774, "percentage": 2.04, "elapsed_time": "0:22:08", "remaining_time": "17:46:02", "throughput": 3347.94, "total_tokens": 4449024} +{"current_steps": 3660, "total_steps": 179580, "loss": 0.2398, "lr": 1.0187660095779041e-05, "epoch": 0.4076177748078851, "percentage": 2.04, "elapsed_time": "0:22:10", "remaining_time": "17:46:01", "throughput": 3347.87, "total_tokens": 4455040} +{"current_steps": 3665, "total_steps": 179580, "loss": 0.2482, "lr": 1.0201581467869474e-05, "epoch": 0.4081746296915024, "percentage": 2.04, "elapsed_time": "0:22:12", "remaining_time": "17:45:59", "throughput": 3347.85, "total_tokens": 4461088} +{"current_steps": 3670, "total_steps": 179580, "loss": 0.2614, "lr": 1.0215502839959908e-05, "epoch": 0.4087314845751197, "percentage": 2.04, "elapsed_time": "0:22:14", "remaining_time": "17:46:01", "throughput": 3347.89, "total_tokens": 4467520} +{"current_steps": 3675, "total_steps": 179580, "loss": 0.238, "lr": 1.022942421205034e-05, "epoch": 0.40928833945873705, "percentage": 2.05, "elapsed_time": "0:22:16", "remaining_time": "17:45:57", "throughput": 3347.87, "total_tokens": 4473440} +{"current_steps": 3680, "total_steps": 179580, "loss": 0.1707, "lr": 1.0243345584140773e-05, "epoch": 0.4098451943423544, "percentage": 2.05, "elapsed_time": "0:22:18", "remaining_time": "17:46:00", "throughput": 3347.89, "total_tokens": 4479904} +{"current_steps": 3685, "total_steps": 179580, "loss": 0.4047, "lr": 1.0257266956231206e-05, "epoch": 0.41040204922597173, "percentage": 2.05, "elapsed_time": "0:22:19", "remaining_time": "17:45:56", "throughput": 3347.94, "total_tokens": 4485856} +{"current_steps": 3690, "total_steps": 179580, "loss": 0.2353, "lr": 1.027118832832164e-05, "epoch": 0.410958904109589, "percentage": 2.05, "elapsed_time": "0:22:21", "remaining_time": "17:45:54", "throughput": 3348.01, "total_tokens": 4492032} +{"current_steps": 3695, "total_steps": 179580, "loss": 0.2677, "lr": 1.0285109700412073e-05, "epoch": 0.41151575899320636, "percentage": 2.06, "elapsed_time": "0:22:23", "remaining_time": "17:45:51", "throughput": 3348.02, "total_tokens": 4498080} +{"current_steps": 3700, "total_steps": 179580, "loss": 0.2811, "lr": 1.0299031072502506e-05, "epoch": 0.4120726138768237, "percentage": 2.06, "elapsed_time": "0:22:25", "remaining_time": "17:45:51", "throughput": 3348.02, "total_tokens": 4504256} +{"current_steps": 3705, "total_steps": 179580, "loss": 0.2685, "lr": 1.031295244459294e-05, "epoch": 0.41262946876044104, "percentage": 2.06, "elapsed_time": "0:22:27", "remaining_time": "17:45:51", "throughput": 3347.98, "total_tokens": 4510432} +{"current_steps": 3710, "total_steps": 179580, "loss": 0.2767, "lr": 1.0326873816683373e-05, "epoch": 0.4131863236440584, "percentage": 2.07, "elapsed_time": "0:22:29", "remaining_time": "17:45:54", "throughput": 3348.05, "total_tokens": 4516928} +{"current_steps": 3715, "total_steps": 179580, "loss": 0.3305, "lr": 1.0340795188773807e-05, "epoch": 0.41374317852767567, "percentage": 2.07, "elapsed_time": "0:22:30", "remaining_time": "17:45:53", "throughput": 3348.05, "total_tokens": 4523104} +{"current_steps": 3720, "total_steps": 179580, "loss": 0.2465, "lr": 1.0354716560864238e-05, "epoch": 0.414300033411293, "percentage": 2.07, "elapsed_time": "0:22:32", "remaining_time": "17:45:57", "throughput": 3348.12, "total_tokens": 4529696} +{"current_steps": 3725, "total_steps": 179580, "loss": 0.3976, "lr": 1.0368637932954672e-05, "epoch": 0.41485688829491035, "percentage": 2.07, "elapsed_time": "0:22:34", "remaining_time": "17:45:52", "throughput": 3348.02, "total_tokens": 4535392} +{"current_steps": 3730, "total_steps": 179580, "loss": 0.1716, "lr": 1.0382559305045107e-05, "epoch": 0.4154137431785277, "percentage": 2.08, "elapsed_time": "0:22:36", "remaining_time": "17:45:50", "throughput": 3348.05, "total_tokens": 4541504} +{"current_steps": 3735, "total_steps": 179580, "loss": 0.4936, "lr": 1.039648067713554e-05, "epoch": 0.415970598062145, "percentage": 2.08, "elapsed_time": "0:22:38", "remaining_time": "17:45:47", "throughput": 3348.09, "total_tokens": 4547616} +{"current_steps": 3740, "total_steps": 179580, "loss": 0.0939, "lr": 1.0410402049225972e-05, "epoch": 0.4165274529457623, "percentage": 2.08, "elapsed_time": "0:22:40", "remaining_time": "17:45:48", "throughput": 3348.09, "total_tokens": 4553856} +{"current_steps": 3745, "total_steps": 179580, "loss": 0.365, "lr": 1.0424323421316405e-05, "epoch": 0.41708430782937966, "percentage": 2.09, "elapsed_time": "0:22:41", "remaining_time": "17:45:44", "throughput": 3348.12, "total_tokens": 4559872} +{"current_steps": 3750, "total_steps": 179580, "loss": 0.1881, "lr": 1.0438244793406839e-05, "epoch": 0.417641162712997, "percentage": 2.09, "elapsed_time": "0:22:43", "remaining_time": "17:45:44", "throughput": 3348.17, "total_tokens": 4566144} +{"current_steps": 3755, "total_steps": 179580, "loss": 0.2507, "lr": 1.0452166165497271e-05, "epoch": 0.41819801759661435, "percentage": 2.09, "elapsed_time": "0:22:45", "remaining_time": "17:45:44", "throughput": 3348.13, "total_tokens": 4572320} +{"current_steps": 3760, "total_steps": 179580, "loss": 0.0467, "lr": 1.0466087537587706e-05, "epoch": 0.41875487248023163, "percentage": 2.09, "elapsed_time": "0:22:47", "remaining_time": "17:45:45", "throughput": 3348.13, "total_tokens": 4578560} +{"current_steps": 3765, "total_steps": 179580, "loss": 0.4241, "lr": 1.0480008909678138e-05, "epoch": 0.419311727363849, "percentage": 2.1, "elapsed_time": "0:22:49", "remaining_time": "17:45:40", "throughput": 3348.11, "total_tokens": 4584416} +{"current_steps": 3770, "total_steps": 179580, "loss": 0.178, "lr": 1.0493930281768571e-05, "epoch": 0.4198685822474663, "percentage": 2.1, "elapsed_time": "0:22:51", "remaining_time": "17:45:35", "throughput": 3348.15, "total_tokens": 4590336} +{"current_steps": 3775, "total_steps": 179580, "loss": 0.276, "lr": 1.0507851653859005e-05, "epoch": 0.42042543713108366, "percentage": 2.1, "elapsed_time": "0:22:52", "remaining_time": "17:45:34", "throughput": 3348.14, "total_tokens": 4596480} +{"current_steps": 3780, "total_steps": 179580, "loss": 0.2409, "lr": 1.0521773025949438e-05, "epoch": 0.42098229201470094, "percentage": 2.1, "elapsed_time": "0:22:54", "remaining_time": "17:45:31", "throughput": 3348.13, "total_tokens": 4602496} +{"current_steps": 3785, "total_steps": 179580, "loss": 0.2159, "lr": 1.053569439803987e-05, "epoch": 0.4215391468983183, "percentage": 2.11, "elapsed_time": "0:22:56", "remaining_time": "17:45:31", "throughput": 3348.14, "total_tokens": 4608672} +{"current_steps": 3790, "total_steps": 179580, "loss": 0.1032, "lr": 1.0549615770130305e-05, "epoch": 0.4220960017819356, "percentage": 2.11, "elapsed_time": "0:22:58", "remaining_time": "17:45:27", "throughput": 3348.11, "total_tokens": 4614560} +{"current_steps": 3795, "total_steps": 179580, "loss": 0.2612, "lr": 1.0563537142220738e-05, "epoch": 0.42265285666555297, "percentage": 2.11, "elapsed_time": "0:23:00", "remaining_time": "17:45:26", "throughput": 3348.16, "total_tokens": 4620832} +{"current_steps": 3800, "total_steps": 179580, "loss": 0.3052, "lr": 1.0577458514311172e-05, "epoch": 0.4232097115491703, "percentage": 2.12, "elapsed_time": "0:23:01", "remaining_time": "17:45:28", "throughput": 3348.17, "total_tokens": 4627168} +{"current_steps": 3805, "total_steps": 179580, "loss": 0.2741, "lr": 1.0591379886401605e-05, "epoch": 0.4237665664327876, "percentage": 2.12, "elapsed_time": "0:23:03", "remaining_time": "17:45:27", "throughput": 3348.23, "total_tokens": 4633440} +{"current_steps": 3810, "total_steps": 179580, "loss": 0.5407, "lr": 1.0605301258492037e-05, "epoch": 0.42432342131640494, "percentage": 2.12, "elapsed_time": "0:23:05", "remaining_time": "17:45:25", "throughput": 3348.26, "total_tokens": 4639520} +{"current_steps": 3815, "total_steps": 179580, "loss": 0.1965, "lr": 1.061922263058247e-05, "epoch": 0.4248802762000223, "percentage": 2.12, "elapsed_time": "0:23:07", "remaining_time": "17:45:24", "throughput": 3348.23, "total_tokens": 4645600} +{"current_steps": 3820, "total_steps": 179580, "loss": 0.4194, "lr": 1.0633144002672904e-05, "epoch": 0.4254371310836396, "percentage": 2.13, "elapsed_time": "0:23:09", "remaining_time": "17:45:20", "throughput": 3348.22, "total_tokens": 4651552} +{"current_steps": 3825, "total_steps": 179580, "loss": 0.1931, "lr": 1.0647065374763337e-05, "epoch": 0.4259939859672569, "percentage": 2.13, "elapsed_time": "0:23:11", "remaining_time": "17:45:17", "throughput": 3348.17, "total_tokens": 4657504} +{"current_steps": 3830, "total_steps": 179580, "loss": 0.1493, "lr": 1.0660986746853771e-05, "epoch": 0.42655084085087425, "percentage": 2.13, "elapsed_time": "0:23:12", "remaining_time": "17:45:16", "throughput": 3348.16, "total_tokens": 4663616} +{"current_steps": 3835, "total_steps": 179580, "loss": 0.223, "lr": 1.0674908118944204e-05, "epoch": 0.4271076957344916, "percentage": 2.14, "elapsed_time": "0:23:14", "remaining_time": "17:45:13", "throughput": 3348.09, "total_tokens": 4669504} +{"current_steps": 3840, "total_steps": 179580, "loss": 0.2214, "lr": 1.0688829491034636e-05, "epoch": 0.42766455061810893, "percentage": 2.14, "elapsed_time": "0:23:16", "remaining_time": "17:45:06", "throughput": 3348.04, "total_tokens": 4675136} +{"current_steps": 3845, "total_steps": 179580, "loss": 0.3096, "lr": 1.070275086312507e-05, "epoch": 0.42822140550172627, "percentage": 2.14, "elapsed_time": "0:23:18", "remaining_time": "17:45:03", "throughput": 3348.05, "total_tokens": 4681184} +{"current_steps": 3850, "total_steps": 179580, "loss": 0.3149, "lr": 1.0716672235215503e-05, "epoch": 0.42877826038534356, "percentage": 2.14, "elapsed_time": "0:23:19", "remaining_time": "17:45:01", "throughput": 3348.04, "total_tokens": 4687200} +{"current_steps": 3855, "total_steps": 179580, "loss": 0.1225, "lr": 1.0730593607305936e-05, "epoch": 0.4293351152689609, "percentage": 2.15, "elapsed_time": "0:23:21", "remaining_time": "17:44:57", "throughput": 3348.08, "total_tokens": 4693248} +{"current_steps": 3860, "total_steps": 179580, "loss": 0.2075, "lr": 1.074451497939637e-05, "epoch": 0.42989197015257824, "percentage": 2.15, "elapsed_time": "0:23:23", "remaining_time": "17:44:55", "throughput": 3348.09, "total_tokens": 4699296} +{"current_steps": 3865, "total_steps": 179580, "loss": 0.1414, "lr": 1.0758436351486803e-05, "epoch": 0.4304488250361956, "percentage": 2.15, "elapsed_time": "0:23:25", "remaining_time": "17:44:52", "throughput": 3348.05, "total_tokens": 4705216} +{"current_steps": 3870, "total_steps": 179580, "loss": 0.2018, "lr": 1.0772357723577237e-05, "epoch": 0.4310056799198129, "percentage": 2.16, "elapsed_time": "0:23:27", "remaining_time": "17:44:50", "throughput": 3348.01, "total_tokens": 4711264} +{"current_steps": 3875, "total_steps": 179580, "loss": 0.3243, "lr": 1.078627909566767e-05, "epoch": 0.4315625348034302, "percentage": 2.16, "elapsed_time": "0:23:29", "remaining_time": "17:44:52", "throughput": 3348.07, "total_tokens": 4717728} +{"current_steps": 3880, "total_steps": 179580, "loss": 0.3273, "lr": 1.0800200467758103e-05, "epoch": 0.43211938968704755, "percentage": 2.16, "elapsed_time": "0:23:30", "remaining_time": "17:44:53", "throughput": 3348.0, "total_tokens": 4723936} +{"current_steps": 3885, "total_steps": 179580, "loss": 0.2744, "lr": 1.0814121839848535e-05, "epoch": 0.4326762445706649, "percentage": 2.16, "elapsed_time": "0:23:32", "remaining_time": "17:44:55", "throughput": 3348.04, "total_tokens": 4730368} +{"current_steps": 3890, "total_steps": 179580, "loss": 0.0902, "lr": 1.082804321193897e-05, "epoch": 0.43323309945428223, "percentage": 2.17, "elapsed_time": "0:23:34", "remaining_time": "17:44:48", "throughput": 3347.97, "total_tokens": 4735936} +{"current_steps": 3895, "total_steps": 179580, "loss": 0.2725, "lr": 1.0841964584029402e-05, "epoch": 0.4337899543378995, "percentage": 2.17, "elapsed_time": "0:23:36", "remaining_time": "17:44:44", "throughput": 3347.92, "total_tokens": 4741824} +{"current_steps": 3900, "total_steps": 179580, "loss": 0.3214, "lr": 1.0855885956119835e-05, "epoch": 0.43434680922151686, "percentage": 2.17, "elapsed_time": "0:23:38", "remaining_time": "17:44:45", "throughput": 3347.92, "total_tokens": 4748128} +{"current_steps": 3905, "total_steps": 179580, "loss": 0.2283, "lr": 1.0869807328210269e-05, "epoch": 0.4349036641051342, "percentage": 2.17, "elapsed_time": "0:23:40", "remaining_time": "17:44:42", "throughput": 3347.98, "total_tokens": 4754208} +{"current_steps": 3910, "total_steps": 179580, "loss": 0.1447, "lr": 1.0883728700300702e-05, "epoch": 0.43546051898875154, "percentage": 2.18, "elapsed_time": "0:23:41", "remaining_time": "17:44:41", "throughput": 3347.96, "total_tokens": 4760320} +{"current_steps": 3915, "total_steps": 179580, "loss": 0.2359, "lr": 1.0897650072391136e-05, "epoch": 0.4360173738723689, "percentage": 2.18, "elapsed_time": "0:23:43", "remaining_time": "17:44:43", "throughput": 3347.96, "total_tokens": 4766656} +{"current_steps": 3920, "total_steps": 179580, "loss": 0.1818, "lr": 1.0911571444481569e-05, "epoch": 0.43657422875598617, "percentage": 2.18, "elapsed_time": "0:23:45", "remaining_time": "17:44:42", "throughput": 3347.94, "total_tokens": 4772768} +{"current_steps": 3925, "total_steps": 179580, "loss": 0.2875, "lr": 1.0925492816572001e-05, "epoch": 0.4371310836396035, "percentage": 2.19, "elapsed_time": "0:23:47", "remaining_time": "17:44:35", "throughput": 3347.92, "total_tokens": 4778464} +{"current_steps": 3930, "total_steps": 179580, "loss": 0.2309, "lr": 1.0939414188662436e-05, "epoch": 0.43768793852322085, "percentage": 2.19, "elapsed_time": "0:23:49", "remaining_time": "17:44:37", "throughput": 3347.97, "total_tokens": 4784896} +{"current_steps": 3935, "total_steps": 179580, "loss": 0.2215, "lr": 1.0953335560752868e-05, "epoch": 0.4382447934068382, "percentage": 2.19, "elapsed_time": "0:23:50", "remaining_time": "17:44:31", "throughput": 3347.91, "total_tokens": 4790624} +{"current_steps": 3940, "total_steps": 179580, "loss": 0.3465, "lr": 1.0967256932843303e-05, "epoch": 0.4388016482904555, "percentage": 2.19, "elapsed_time": "0:23:52", "remaining_time": "17:44:30", "throughput": 3347.88, "total_tokens": 4796704} +{"current_steps": 3945, "total_steps": 179580, "loss": 0.3316, "lr": 1.0981178304933734e-05, "epoch": 0.4393585031740728, "percentage": 2.2, "elapsed_time": "0:23:54", "remaining_time": "17:44:29", "throughput": 3347.87, "total_tokens": 4802848} +{"current_steps": 3950, "total_steps": 179580, "loss": 0.334, "lr": 1.0995099677024168e-05, "epoch": 0.43991535805769016, "percentage": 2.2, "elapsed_time": "0:23:56", "remaining_time": "17:44:24", "throughput": 3347.87, "total_tokens": 4808672} +{"current_steps": 3955, "total_steps": 179580, "loss": 0.3684, "lr": 1.10090210491146e-05, "epoch": 0.4404722129413075, "percentage": 2.2, "elapsed_time": "0:23:58", "remaining_time": "17:44:22", "throughput": 3347.86, "total_tokens": 4814720} +{"current_steps": 3960, "total_steps": 179580, "loss": 0.3079, "lr": 1.1022942421205035e-05, "epoch": 0.44102906782492485, "percentage": 2.21, "elapsed_time": "0:23:59", "remaining_time": "17:44:20", "throughput": 3347.92, "total_tokens": 4820896} +{"current_steps": 3965, "total_steps": 179580, "loss": 0.2952, "lr": 1.1036863793295468e-05, "epoch": 0.44158592270854213, "percentage": 2.21, "elapsed_time": "0:24:01", "remaining_time": "17:44:18", "throughput": 3347.94, "total_tokens": 4826976} +{"current_steps": 3970, "total_steps": 179580, "loss": 0.2037, "lr": 1.10507851653859e-05, "epoch": 0.4421427775921595, "percentage": 2.21, "elapsed_time": "0:24:03", "remaining_time": "17:44:12", "throughput": 3348.0, "total_tokens": 4832896} +{"current_steps": 3975, "total_steps": 179580, "loss": 0.217, "lr": 1.1064706537476335e-05, "epoch": 0.4426996324757768, "percentage": 2.21, "elapsed_time": "0:24:05", "remaining_time": "17:44:12", "throughput": 3348.07, "total_tokens": 4839200} +{"current_steps": 3980, "total_steps": 179580, "loss": 0.0733, "lr": 1.1078627909566767e-05, "epoch": 0.44325648735939416, "percentage": 2.22, "elapsed_time": "0:24:07", "remaining_time": "17:44:11", "throughput": 3348.08, "total_tokens": 4845376} +{"current_steps": 3985, "total_steps": 179580, "loss": 0.1804, "lr": 1.1092549281657201e-05, "epoch": 0.44381334224301144, "percentage": 2.22, "elapsed_time": "0:24:08", "remaining_time": "17:44:06", "throughput": 3348.05, "total_tokens": 4851168} +{"current_steps": 3990, "total_steps": 179580, "loss": 0.2313, "lr": 1.1106470653747634e-05, "epoch": 0.4443701971266288, "percentage": 2.22, "elapsed_time": "0:24:10", "remaining_time": "17:43:57", "throughput": 3348.0, "total_tokens": 4856608} +{"current_steps": 3995, "total_steps": 179580, "loss": 0.1877, "lr": 1.1120392025838067e-05, "epoch": 0.4449270520102461, "percentage": 2.22, "elapsed_time": "0:24:12", "remaining_time": "17:43:50", "throughput": 3347.92, "total_tokens": 4862176} +{"current_steps": 4000, "total_steps": 179580, "loss": 0.149, "lr": 1.1134313397928501e-05, "epoch": 0.44548390689386347, "percentage": 2.23, "elapsed_time": "0:24:14", "remaining_time": "17:43:47", "throughput": 3347.9, "total_tokens": 4868192} +{"current_steps": 4005, "total_steps": 179580, "loss": 0.2756, "lr": 1.1148234770018934e-05, "epoch": 0.4460407617774808, "percentage": 2.23, "elapsed_time": "0:24:15", "remaining_time": "17:43:47", "throughput": 3347.92, "total_tokens": 4874400} +{"current_steps": 4010, "total_steps": 179580, "loss": 0.2676, "lr": 1.1162156142109368e-05, "epoch": 0.4465976166610981, "percentage": 2.23, "elapsed_time": "0:24:17", "remaining_time": "17:43:43", "throughput": 3347.96, "total_tokens": 4880416} +{"current_steps": 4015, "total_steps": 179580, "loss": 0.2529, "lr": 1.1176077514199799e-05, "epoch": 0.44715447154471544, "percentage": 2.24, "elapsed_time": "0:24:19", "remaining_time": "17:43:40", "throughput": 3347.93, "total_tokens": 4886368} +{"current_steps": 4020, "total_steps": 179580, "loss": 0.1835, "lr": 1.1189998886290233e-05, "epoch": 0.4477113264283328, "percentage": 2.24, "elapsed_time": "0:24:21", "remaining_time": "17:43:41", "throughput": 3347.93, "total_tokens": 4892608} +{"current_steps": 4025, "total_steps": 179580, "loss": 0.1814, "lr": 1.1203920258380666e-05, "epoch": 0.4482681813119501, "percentage": 2.24, "elapsed_time": "0:24:23", "remaining_time": "17:43:39", "throughput": 3347.93, "total_tokens": 4898752} +{"current_steps": 4030, "total_steps": 179580, "loss": 0.2948, "lr": 1.12178416304711e-05, "epoch": 0.44882503619556746, "percentage": 2.24, "elapsed_time": "0:24:24", "remaining_time": "17:43:35", "throughput": 3347.88, "total_tokens": 4904576} +{"current_steps": 4035, "total_steps": 179580, "loss": 0.1492, "lr": 1.1231763002561533e-05, "epoch": 0.44938189107918475, "percentage": 2.25, "elapsed_time": "0:24:26", "remaining_time": "17:43:33", "throughput": 3347.87, "total_tokens": 4910592} +{"current_steps": 4040, "total_steps": 179580, "loss": 0.4213, "lr": 1.1245684374651966e-05, "epoch": 0.4499387459628021, "percentage": 2.25, "elapsed_time": "0:24:28", "remaining_time": "17:43:29", "throughput": 3347.86, "total_tokens": 4916512} +{"current_steps": 4045, "total_steps": 179580, "loss": 0.4181, "lr": 1.12596057467424e-05, "epoch": 0.45049560084641943, "percentage": 2.25, "elapsed_time": "0:24:30", "remaining_time": "17:43:28", "throughput": 3347.89, "total_tokens": 4922720} +{"current_steps": 4050, "total_steps": 179580, "loss": 0.136, "lr": 1.1273527118832832e-05, "epoch": 0.45105245573003677, "percentage": 2.26, "elapsed_time": "0:24:32", "remaining_time": "17:43:27", "throughput": 3347.85, "total_tokens": 4928800} +{"current_steps": 4055, "total_steps": 179580, "loss": 0.4609, "lr": 1.1287448490923267e-05, "epoch": 0.45160931061365406, "percentage": 2.26, "elapsed_time": "0:24:34", "remaining_time": "17:43:24", "throughput": 3347.85, "total_tokens": 4934816} +{"current_steps": 4060, "total_steps": 179580, "loss": 0.2122, "lr": 1.1301369863013698e-05, "epoch": 0.4521661654972714, "percentage": 2.26, "elapsed_time": "0:24:35", "remaining_time": "17:43:22", "throughput": 3347.8, "total_tokens": 4940768} +{"current_steps": 4065, "total_steps": 179580, "loss": 0.2914, "lr": 1.1315291235104132e-05, "epoch": 0.45272302038088874, "percentage": 2.26, "elapsed_time": "0:24:37", "remaining_time": "17:43:19", "throughput": 3347.8, "total_tokens": 4946816} +{"current_steps": 4070, "total_steps": 179580, "loss": 0.1229, "lr": 1.1329212607194566e-05, "epoch": 0.4532798752645061, "percentage": 2.27, "elapsed_time": "0:24:39", "remaining_time": "17:43:20", "throughput": 3347.84, "total_tokens": 4953152} +{"current_steps": 4075, "total_steps": 179580, "loss": 0.4184, "lr": 1.1343133979284999e-05, "epoch": 0.4538367301481234, "percentage": 2.27, "elapsed_time": "0:24:41", "remaining_time": "17:43:18", "throughput": 3347.89, "total_tokens": 4959296} +{"current_steps": 4080, "total_steps": 179580, "loss": 0.1288, "lr": 1.1357055351375433e-05, "epoch": 0.4543935850317407, "percentage": 2.27, "elapsed_time": "0:24:43", "remaining_time": "17:43:18", "throughput": 3347.93, "total_tokens": 4965600} +{"current_steps": 4085, "total_steps": 179580, "loss": 0.3127, "lr": 1.1370976723465864e-05, "epoch": 0.45495043991535805, "percentage": 2.27, "elapsed_time": "0:24:45", "remaining_time": "17:43:18", "throughput": 3347.93, "total_tokens": 4971776} +{"current_steps": 4090, "total_steps": 179580, "loss": 0.3326, "lr": 1.1384898095556299e-05, "epoch": 0.4555072947989754, "percentage": 2.28, "elapsed_time": "0:24:46", "remaining_time": "17:43:16", "throughput": 3347.93, "total_tokens": 4977920} +{"current_steps": 4095, "total_steps": 179580, "loss": 0.2133, "lr": 1.1398819467646731e-05, "epoch": 0.45606414968259273, "percentage": 2.28, "elapsed_time": "0:24:48", "remaining_time": "17:43:16", "throughput": 3347.92, "total_tokens": 4984128} +{"current_steps": 4100, "total_steps": 179580, "loss": 0.1112, "lr": 1.1412740839737166e-05, "epoch": 0.45662100456621, "percentage": 2.28, "elapsed_time": "0:24:50", "remaining_time": "17:43:17", "throughput": 3347.98, "total_tokens": 4990496} +{"current_steps": 4105, "total_steps": 179580, "loss": 0.2156, "lr": 1.1426662211827598e-05, "epoch": 0.45717785944982736, "percentage": 2.29, "elapsed_time": "0:24:52", "remaining_time": "17:43:15", "throughput": 3348.0, "total_tokens": 4996608} +{"current_steps": 4110, "total_steps": 179580, "loss": 0.2838, "lr": 1.1440583583918031e-05, "epoch": 0.4577347143334447, "percentage": 2.29, "elapsed_time": "0:24:54", "remaining_time": "17:43:17", "throughput": 3348.05, "total_tokens": 5003040} +{"current_steps": 4115, "total_steps": 179580, "loss": 0.2333, "lr": 1.1454504956008465e-05, "epoch": 0.45829156921706204, "percentage": 2.29, "elapsed_time": "0:24:56", "remaining_time": "17:43:18", "throughput": 3348.07, "total_tokens": 5009344} +{"current_steps": 4120, "total_steps": 179580, "loss": 0.3028, "lr": 1.1468426328098898e-05, "epoch": 0.4588484241006794, "percentage": 2.29, "elapsed_time": "0:24:58", "remaining_time": "17:43:16", "throughput": 3348.03, "total_tokens": 5015424} +{"current_steps": 4125, "total_steps": 179580, "loss": 0.1096, "lr": 1.1482347700189332e-05, "epoch": 0.45940527898429667, "percentage": 2.3, "elapsed_time": "0:24:59", "remaining_time": "17:43:15", "throughput": 3348.02, "total_tokens": 5021568} +{"current_steps": 4130, "total_steps": 179580, "loss": 0.2788, "lr": 1.1496269072279763e-05, "epoch": 0.459962133867914, "percentage": 2.3, "elapsed_time": "0:25:01", "remaining_time": "17:43:13", "throughput": 3348.03, "total_tokens": 5027648} +{"current_steps": 4135, "total_steps": 179580, "loss": 0.1881, "lr": 1.1510190444370197e-05, "epoch": 0.46051898875153136, "percentage": 2.3, "elapsed_time": "0:25:03", "remaining_time": "17:43:13", "throughput": 3348.07, "total_tokens": 5033920} +{"current_steps": 4140, "total_steps": 179580, "loss": 0.2803, "lr": 1.1524111816460632e-05, "epoch": 0.4610758436351487, "percentage": 2.31, "elapsed_time": "0:25:05", "remaining_time": "17:43:08", "throughput": 3348.08, "total_tokens": 5039776} +{"current_steps": 4145, "total_steps": 179580, "loss": 0.1198, "lr": 1.1538033188551064e-05, "epoch": 0.461632698518766, "percentage": 2.31, "elapsed_time": "0:25:07", "remaining_time": "17:43:07", "throughput": 3348.06, "total_tokens": 5045920} +{"current_steps": 4150, "total_steps": 179580, "loss": 0.2158, "lr": 1.1551954560641499e-05, "epoch": 0.4621895534023833, "percentage": 2.31, "elapsed_time": "0:25:09", "remaining_time": "17:43:10", "throughput": 3348.12, "total_tokens": 5052480} +{"current_steps": 4155, "total_steps": 179580, "loss": 0.2657, "lr": 1.156587593273193e-05, "epoch": 0.46274640828600067, "percentage": 2.31, "elapsed_time": "0:25:10", "remaining_time": "17:43:12", "throughput": 3348.17, "total_tokens": 5058944} +{"current_steps": 4160, "total_steps": 179580, "loss": 0.3213, "lr": 1.1579797304822364e-05, "epoch": 0.463303263169618, "percentage": 2.32, "elapsed_time": "0:25:12", "remaining_time": "17:43:10", "throughput": 3348.18, "total_tokens": 5065024} +{"current_steps": 4165, "total_steps": 179580, "loss": 0.3873, "lr": 1.1593718676912797e-05, "epoch": 0.46386011805323535, "percentage": 2.32, "elapsed_time": "0:25:14", "remaining_time": "17:43:10", "throughput": 3348.17, "total_tokens": 5071232} +{"current_steps": 4170, "total_steps": 179580, "loss": 0.2101, "lr": 1.1607640049003231e-05, "epoch": 0.46441697293685263, "percentage": 2.32, "elapsed_time": "0:25:16", "remaining_time": "17:43:13", "throughput": 3348.21, "total_tokens": 5077760} +{"current_steps": 4175, "total_steps": 179580, "loss": 0.2815, "lr": 1.1621561421093664e-05, "epoch": 0.46497382782047, "percentage": 2.32, "elapsed_time": "0:25:18", "remaining_time": "17:43:07", "throughput": 3348.14, "total_tokens": 5083392} +{"current_steps": 4180, "total_steps": 179580, "loss": 0.2434, "lr": 1.1635482793184096e-05, "epoch": 0.4655306827040873, "percentage": 2.33, "elapsed_time": "0:25:20", "remaining_time": "17:43:06", "throughput": 3348.14, "total_tokens": 5089536} +{"current_steps": 4185, "total_steps": 179580, "loss": 0.4052, "lr": 1.164940416527453e-05, "epoch": 0.46608753758770466, "percentage": 2.33, "elapsed_time": "0:25:21", "remaining_time": "17:43:05", "throughput": 3348.13, "total_tokens": 5095680} +{"current_steps": 4190, "total_steps": 179580, "loss": 0.3094, "lr": 1.1663325537364963e-05, "epoch": 0.466644392471322, "percentage": 2.33, "elapsed_time": "0:25:23", "remaining_time": "17:43:06", "throughput": 3348.13, "total_tokens": 5102016} +{"current_steps": 4195, "total_steps": 179580, "loss": 0.2389, "lr": 1.1677246909455398e-05, "epoch": 0.4672012473549393, "percentage": 2.34, "elapsed_time": "0:25:25", "remaining_time": "17:43:08", "throughput": 3348.18, "total_tokens": 5108448} +{"current_steps": 4200, "total_steps": 179580, "loss": 0.3028, "lr": 1.1691168281545828e-05, "epoch": 0.46775810223855663, "percentage": 2.34, "elapsed_time": "0:25:27", "remaining_time": "17:43:07", "throughput": 3348.19, "total_tokens": 5114624} +{"current_steps": 4205, "total_steps": 179580, "loss": 0.3461, "lr": 1.1705089653636263e-05, "epoch": 0.46831495712217397, "percentage": 2.34, "elapsed_time": "0:25:29", "remaining_time": "17:43:05", "throughput": 3348.22, "total_tokens": 5120736} +{"current_steps": 4210, "total_steps": 179580, "loss": 0.2601, "lr": 1.1719011025726697e-05, "epoch": 0.4688718120057913, "percentage": 2.34, "elapsed_time": "0:25:31", "remaining_time": "17:43:00", "throughput": 3348.24, "total_tokens": 5126656} +{"current_steps": 4215, "total_steps": 179580, "loss": 0.2805, "lr": 1.173293239781713e-05, "epoch": 0.4694286668894086, "percentage": 2.35, "elapsed_time": "0:25:32", "remaining_time": "17:42:58", "throughput": 3348.22, "total_tokens": 5132640} +{"current_steps": 4220, "total_steps": 179580, "loss": 0.2894, "lr": 1.1746853769907562e-05, "epoch": 0.46998552177302594, "percentage": 2.35, "elapsed_time": "0:25:34", "remaining_time": "17:42:54", "throughput": 3348.2, "total_tokens": 5138560} +{"current_steps": 4225, "total_steps": 179580, "loss": 0.4063, "lr": 1.1760775141997995e-05, "epoch": 0.4705423766566433, "percentage": 2.35, "elapsed_time": "0:25:36", "remaining_time": "17:42:53", "throughput": 3348.19, "total_tokens": 5144704} +{"current_steps": 4230, "total_steps": 179580, "loss": 0.1866, "lr": 1.177469651408843e-05, "epoch": 0.4710992315402606, "percentage": 2.36, "elapsed_time": "0:25:38", "remaining_time": "17:42:50", "throughput": 3348.17, "total_tokens": 5150656} +{"current_steps": 4235, "total_steps": 179580, "loss": 0.2361, "lr": 1.1788617886178862e-05, "epoch": 0.47165608642387796, "percentage": 2.36, "elapsed_time": "0:25:40", "remaining_time": "17:42:51", "throughput": 3348.18, "total_tokens": 5156960} +{"current_steps": 4240, "total_steps": 179580, "loss": 0.2444, "lr": 1.1802539258269296e-05, "epoch": 0.47221294130749525, "percentage": 2.36, "elapsed_time": "0:25:42", "remaining_time": "17:42:47", "throughput": 3348.17, "total_tokens": 5162880} +{"current_steps": 4245, "total_steps": 179580, "loss": 0.4832, "lr": 1.1816460630359729e-05, "epoch": 0.4727697961911126, "percentage": 2.36, "elapsed_time": "0:25:43", "remaining_time": "17:42:47", "throughput": 3348.22, "total_tokens": 5169216} +{"current_steps": 4250, "total_steps": 179580, "loss": 0.2215, "lr": 1.1830382002450162e-05, "epoch": 0.47332665107472993, "percentage": 2.37, "elapsed_time": "0:25:45", "remaining_time": "17:42:44", "throughput": 3348.23, "total_tokens": 5175200} +{"current_steps": 4255, "total_steps": 179580, "loss": 0.2079, "lr": 1.1844303374540596e-05, "epoch": 0.4738835059583473, "percentage": 2.37, "elapsed_time": "0:25:47", "remaining_time": "17:42:42", "throughput": 3348.23, "total_tokens": 5181248} +{"current_steps": 4260, "total_steps": 179580, "loss": 0.327, "lr": 1.1858224746631029e-05, "epoch": 0.47444036084196456, "percentage": 2.37, "elapsed_time": "0:25:49", "remaining_time": "17:42:44", "throughput": 3348.22, "total_tokens": 5187680} +{"current_steps": 4265, "total_steps": 179580, "loss": 0.2996, "lr": 1.1872146118721461e-05, "epoch": 0.4749972157255819, "percentage": 2.37, "elapsed_time": "0:25:51", "remaining_time": "17:42:45", "throughput": 3348.33, "total_tokens": 5194176} +{"current_steps": 4270, "total_steps": 179580, "loss": 0.2809, "lr": 1.1886067490811894e-05, "epoch": 0.47555407060919924, "percentage": 2.38, "elapsed_time": "0:25:53", "remaining_time": "17:42:44", "throughput": 3348.34, "total_tokens": 5200352} +{"current_steps": 4275, "total_steps": 179580, "loss": 0.2134, "lr": 1.1899988862902328e-05, "epoch": 0.4761109254928166, "percentage": 2.38, "elapsed_time": "0:25:54", "remaining_time": "17:42:40", "throughput": 3348.28, "total_tokens": 5206176} +{"current_steps": 4280, "total_steps": 179580, "loss": 0.3709, "lr": 1.1913910234992762e-05, "epoch": 0.4766677803764339, "percentage": 2.38, "elapsed_time": "0:25:56", "remaining_time": "17:42:43", "throughput": 3348.29, "total_tokens": 5212608} +{"current_steps": 4285, "total_steps": 179580, "loss": 0.2234, "lr": 1.1927831607083195e-05, "epoch": 0.4772246352600512, "percentage": 2.39, "elapsed_time": "0:25:58", "remaining_time": "17:42:40", "throughput": 3348.32, "total_tokens": 5218656} +{"current_steps": 4290, "total_steps": 179580, "loss": 0.1728, "lr": 1.1941752979173628e-05, "epoch": 0.47778149014366855, "percentage": 2.39, "elapsed_time": "0:26:00", "remaining_time": "17:42:40", "throughput": 3348.32, "total_tokens": 5224928} +{"current_steps": 4295, "total_steps": 179580, "loss": 0.2852, "lr": 1.195567435126406e-05, "epoch": 0.4783383450272859, "percentage": 2.39, "elapsed_time": "0:26:02", "remaining_time": "17:42:38", "throughput": 3348.27, "total_tokens": 5230880} +{"current_steps": 4300, "total_steps": 179580, "loss": 0.4728, "lr": 1.1969595723354495e-05, "epoch": 0.47889519991090324, "percentage": 2.39, "elapsed_time": "0:26:04", "remaining_time": "17:42:34", "throughput": 3348.22, "total_tokens": 5236736} +{"current_steps": 4305, "total_steps": 179580, "loss": 0.3962, "lr": 1.1983517095444927e-05, "epoch": 0.4794520547945205, "percentage": 2.4, "elapsed_time": "0:26:05", "remaining_time": "17:42:34", "throughput": 3348.19, "total_tokens": 5242912} +{"current_steps": 4310, "total_steps": 179580, "loss": 0.2259, "lr": 1.1997438467535362e-05, "epoch": 0.48000890967813786, "percentage": 2.4, "elapsed_time": "0:26:07", "remaining_time": "17:42:32", "throughput": 3348.2, "total_tokens": 5249056} +{"current_steps": 4315, "total_steps": 179580, "loss": 0.248, "lr": 1.2011359839625794e-05, "epoch": 0.4805657645617552, "percentage": 2.4, "elapsed_time": "0:26:09", "remaining_time": "17:42:29", "throughput": 3348.18, "total_tokens": 5254976} +{"current_steps": 4320, "total_steps": 179580, "loss": 0.4667, "lr": 1.2025281211716227e-05, "epoch": 0.48112261944537255, "percentage": 2.41, "elapsed_time": "0:26:11", "remaining_time": "17:42:27", "throughput": 3348.18, "total_tokens": 5261088} +{"current_steps": 4325, "total_steps": 179580, "loss": 0.1348, "lr": 1.2039202583806661e-05, "epoch": 0.4816794743289899, "percentage": 2.41, "elapsed_time": "0:26:13", "remaining_time": "17:42:25", "throughput": 3348.16, "total_tokens": 5267104} +{"current_steps": 4330, "total_steps": 179580, "loss": 0.1098, "lr": 1.2053123955897094e-05, "epoch": 0.4822363292126072, "percentage": 2.41, "elapsed_time": "0:26:14", "remaining_time": "17:42:24", "throughput": 3348.1, "total_tokens": 5273120} +{"current_steps": 4335, "total_steps": 179580, "loss": 0.2137, "lr": 1.2067045327987527e-05, "epoch": 0.4827931840962245, "percentage": 2.41, "elapsed_time": "0:26:16", "remaining_time": "17:42:12", "throughput": 3347.99, "total_tokens": 5278240} +{"current_steps": 4340, "total_steps": 179580, "loss": 0.1889, "lr": 1.208096670007796e-05, "epoch": 0.48335003897984186, "percentage": 2.42, "elapsed_time": "0:26:18", "remaining_time": "17:42:12", "throughput": 3348.02, "total_tokens": 5284512} +{"current_steps": 4345, "total_steps": 179580, "loss": 0.2551, "lr": 1.2094888072168393e-05, "epoch": 0.4839068938634592, "percentage": 2.42, "elapsed_time": "0:26:20", "remaining_time": "17:42:08", "throughput": 3348.02, "total_tokens": 5290432} +{"current_steps": 4350, "total_steps": 179580, "loss": 0.242, "lr": 1.2108809444258828e-05, "epoch": 0.48446374874707654, "percentage": 2.42, "elapsed_time": "0:26:22", "remaining_time": "17:42:07", "throughput": 3348.05, "total_tokens": 5296640} +{"current_steps": 4355, "total_steps": 179580, "loss": 0.2512, "lr": 1.212273081634926e-05, "epoch": 0.4850206036306938, "percentage": 2.43, "elapsed_time": "0:26:23", "remaining_time": "17:42:05", "throughput": 3348.06, "total_tokens": 5302720} +{"current_steps": 4360, "total_steps": 179580, "loss": 0.2476, "lr": 1.2136652188439693e-05, "epoch": 0.48557745851431117, "percentage": 2.43, "elapsed_time": "0:26:25", "remaining_time": "17:42:05", "throughput": 3348.02, "total_tokens": 5308864} +{"current_steps": 4365, "total_steps": 179580, "loss": 0.2881, "lr": 1.2150573560530126e-05, "epoch": 0.4861343133979285, "percentage": 2.43, "elapsed_time": "0:26:27", "remaining_time": "17:41:58", "throughput": 3347.94, "total_tokens": 5314432} +{"current_steps": 4370, "total_steps": 179580, "loss": 0.2108, "lr": 1.216449493262056e-05, "epoch": 0.48669116828154585, "percentage": 2.43, "elapsed_time": "0:26:29", "remaining_time": "17:41:50", "throughput": 3347.91, "total_tokens": 5319968} +{"current_steps": 4375, "total_steps": 179580, "loss": 0.241, "lr": 1.2178416304710993e-05, "epoch": 0.48724802316516314, "percentage": 2.44, "elapsed_time": "0:26:30", "remaining_time": "17:41:43", "throughput": 3347.9, "total_tokens": 5325568} +{"current_steps": 4380, "total_steps": 179580, "loss": 0.0916, "lr": 1.2192337676801425e-05, "epoch": 0.4878048780487805, "percentage": 2.44, "elapsed_time": "0:26:32", "remaining_time": "17:41:39", "throughput": 3347.89, "total_tokens": 5331520} +{"current_steps": 4385, "total_steps": 179580, "loss": 0.1921, "lr": 1.220625904889186e-05, "epoch": 0.4883617329323978, "percentage": 2.44, "elapsed_time": "0:26:34", "remaining_time": "17:41:43", "throughput": 3347.94, "total_tokens": 5338144} +{"current_steps": 4390, "total_steps": 179580, "loss": 0.1592, "lr": 1.2220180420982292e-05, "epoch": 0.48891858781601516, "percentage": 2.44, "elapsed_time": "0:26:36", "remaining_time": "17:41:41", "throughput": 3347.96, "total_tokens": 5344224} +{"current_steps": 4395, "total_steps": 179580, "loss": 0.1313, "lr": 1.2234101793072727e-05, "epoch": 0.4894754426996325, "percentage": 2.45, "elapsed_time": "0:26:38", "remaining_time": "17:41:38", "throughput": 3347.93, "total_tokens": 5350208} +{"current_steps": 4400, "total_steps": 179580, "loss": 0.1981, "lr": 1.224802316516316e-05, "epoch": 0.4900322975832498, "percentage": 2.45, "elapsed_time": "0:26:39", "remaining_time": "17:41:40", "throughput": 3347.99, "total_tokens": 5356672} +{"current_steps": 4405, "total_steps": 179580, "loss": 0.1135, "lr": 1.2261944537253592e-05, "epoch": 0.49058915246686713, "percentage": 2.45, "elapsed_time": "0:26:41", "remaining_time": "17:41:38", "throughput": 3347.97, "total_tokens": 5362688} +{"current_steps": 4410, "total_steps": 179580, "loss": 0.2493, "lr": 1.2275865909344026e-05, "epoch": 0.49114600735048447, "percentage": 2.46, "elapsed_time": "0:26:43", "remaining_time": "17:41:37", "throughput": 3347.97, "total_tokens": 5368896} +{"current_steps": 4415, "total_steps": 179580, "loss": 0.1949, "lr": 1.2289787281434459e-05, "epoch": 0.4917028622341018, "percentage": 2.46, "elapsed_time": "0:26:45", "remaining_time": "17:41:36", "throughput": 3348.0, "total_tokens": 5375040} +{"current_steps": 4420, "total_steps": 179580, "loss": 0.2871, "lr": 1.2303708653524893e-05, "epoch": 0.4922597171177191, "percentage": 2.46, "elapsed_time": "0:26:47", "remaining_time": "17:41:37", "throughput": 3348.02, "total_tokens": 5381408} +{"current_steps": 4425, "total_steps": 179580, "loss": 0.1384, "lr": 1.2317630025615324e-05, "epoch": 0.49281657200133644, "percentage": 2.46, "elapsed_time": "0:26:49", "remaining_time": "17:41:38", "throughput": 3348.01, "total_tokens": 5387744} +{"current_steps": 4430, "total_steps": 179580, "loss": 0.2453, "lr": 1.2331551397705758e-05, "epoch": 0.4933734268849538, "percentage": 2.47, "elapsed_time": "0:26:51", "remaining_time": "17:41:38", "throughput": 3348.02, "total_tokens": 5394016} +{"current_steps": 4435, "total_steps": 179580, "loss": 0.1153, "lr": 1.2345472769796191e-05, "epoch": 0.4939302817685711, "percentage": 2.47, "elapsed_time": "0:26:53", "remaining_time": "17:41:42", "throughput": 3348.06, "total_tokens": 5400608} +{"current_steps": 4440, "total_steps": 179580, "loss": 0.1692, "lr": 1.2359394141886625e-05, "epoch": 0.49448713665218846, "percentage": 2.47, "elapsed_time": "0:26:54", "remaining_time": "17:41:42", "throughput": 3348.05, "total_tokens": 5406912} +{"current_steps": 4445, "total_steps": 179580, "loss": 0.3193, "lr": 1.2373315513977058e-05, "epoch": 0.49504399153580575, "percentage": 2.48, "elapsed_time": "0:26:56", "remaining_time": "17:41:39", "throughput": 3348.06, "total_tokens": 5412864} +{"current_steps": 4450, "total_steps": 179580, "loss": 0.2505, "lr": 1.238723688606749e-05, "epoch": 0.4956008464194231, "percentage": 2.48, "elapsed_time": "0:26:58", "remaining_time": "17:41:38", "throughput": 3348.03, "total_tokens": 5418944} +{"current_steps": 4455, "total_steps": 179580, "loss": 0.2253, "lr": 1.2401158258157925e-05, "epoch": 0.49615770130304043, "percentage": 2.48, "elapsed_time": "0:27:00", "remaining_time": "17:41:36", "throughput": 3347.99, "total_tokens": 5424992} +{"current_steps": 4460, "total_steps": 179580, "loss": 0.2373, "lr": 1.2415079630248358e-05, "epoch": 0.4967145561866578, "percentage": 2.48, "elapsed_time": "0:27:02", "remaining_time": "17:41:33", "throughput": 3348.01, "total_tokens": 5431008} +{"current_steps": 4465, "total_steps": 179580, "loss": 0.1427, "lr": 1.2429001002338792e-05, "epoch": 0.49727141107027506, "percentage": 2.49, "elapsed_time": "0:27:03", "remaining_time": "17:41:31", "throughput": 3347.96, "total_tokens": 5436992} +{"current_steps": 4470, "total_steps": 179580, "loss": 0.1671, "lr": 1.2442922374429223e-05, "epoch": 0.4978282659538924, "percentage": 2.49, "elapsed_time": "0:27:05", "remaining_time": "17:41:29", "throughput": 3347.95, "total_tokens": 5443104} +{"current_steps": 4475, "total_steps": 179580, "loss": 0.2712, "lr": 1.2456843746519657e-05, "epoch": 0.49838512083750974, "percentage": 2.49, "elapsed_time": "0:27:07", "remaining_time": "17:41:28", "throughput": 3347.98, "total_tokens": 5449248} +{"current_steps": 4480, "total_steps": 179580, "loss": 0.1994, "lr": 1.2470765118610092e-05, "epoch": 0.4989419757211271, "percentage": 2.49, "elapsed_time": "0:27:09", "remaining_time": "17:41:27", "throughput": 3347.98, "total_tokens": 5455392} +{"current_steps": 4485, "total_steps": 179580, "loss": 0.2247, "lr": 1.2484686490700524e-05, "epoch": 0.4994988306047444, "percentage": 2.5, "elapsed_time": "0:27:11", "remaining_time": "17:41:25", "throughput": 3347.96, "total_tokens": 5461504} +{"current_steps": 4490, "total_steps": 179580, "loss": 0.2464, "lr": 1.2498607862790959e-05, "epoch": 0.5000556854883618, "percentage": 2.5, "elapsed_time": "0:27:13", "remaining_time": "17:41:23", "throughput": 3347.95, "total_tokens": 5467520} +{"current_steps": 4495, "total_steps": 179580, "loss": 0.3309, "lr": 1.251252923488139e-05, "epoch": 0.5006125403719791, "percentage": 2.5, "elapsed_time": "0:27:14", "remaining_time": "17:41:22", "throughput": 3347.94, "total_tokens": 5473632} +{"current_steps": 4500, "total_steps": 179580, "loss": 0.2412, "lr": 1.2526450606971824e-05, "epoch": 0.5011693952555963, "percentage": 2.51, "elapsed_time": "0:27:16", "remaining_time": "17:41:13", "throughput": 3347.91, "total_tokens": 5479072} +{"current_steps": 4505, "total_steps": 179580, "loss": 0.4685, "lr": 1.2540371979062256e-05, "epoch": 0.5017262501392137, "percentage": 2.51, "elapsed_time": "0:27:18", "remaining_time": "17:41:11", "throughput": 3347.87, "total_tokens": 5485056} +{"current_steps": 4510, "total_steps": 179580, "loss": 0.1619, "lr": 1.255429335115269e-05, "epoch": 0.502283105022831, "percentage": 2.51, "elapsed_time": "0:27:20", "remaining_time": "17:41:11", "throughput": 3347.94, "total_tokens": 5491456} +{"current_steps": 4515, "total_steps": 179580, "loss": 0.2366, "lr": 1.2568214723243123e-05, "epoch": 0.5028399599064484, "percentage": 2.51, "elapsed_time": "0:27:22", "remaining_time": "17:41:10", "throughput": 3347.97, "total_tokens": 5497696} +{"current_steps": 4520, "total_steps": 179580, "loss": 0.2611, "lr": 1.2582136095333558e-05, "epoch": 0.5033968147900657, "percentage": 2.52, "elapsed_time": "0:27:23", "remaining_time": "17:41:06", "throughput": 3347.94, "total_tokens": 5503520} +{"current_steps": 4525, "total_steps": 179580, "loss": 0.27, "lr": 1.259605746742399e-05, "epoch": 0.503953669673683, "percentage": 2.52, "elapsed_time": "0:27:25", "remaining_time": "17:41:01", "throughput": 3347.89, "total_tokens": 5509280} +{"current_steps": 4530, "total_steps": 179580, "loss": 0.3434, "lr": 1.2609978839514421e-05, "epoch": 0.5045105245573004, "percentage": 2.52, "elapsed_time": "0:27:27", "remaining_time": "17:41:01", "throughput": 3347.95, "total_tokens": 5515584} +{"current_steps": 4535, "total_steps": 179580, "loss": 0.2319, "lr": 1.2623900211604856e-05, "epoch": 0.5050673794409177, "percentage": 2.53, "elapsed_time": "0:27:29", "remaining_time": "17:41:00", "throughput": 3347.93, "total_tokens": 5521760} +{"current_steps": 4540, "total_steps": 179580, "loss": 0.1012, "lr": 1.2637821583695288e-05, "epoch": 0.5056242343245351, "percentage": 2.53, "elapsed_time": "0:27:31", "remaining_time": "17:41:01", "throughput": 3347.95, "total_tokens": 5528128} +{"current_steps": 4545, "total_steps": 179580, "loss": 0.175, "lr": 1.2651742955785723e-05, "epoch": 0.5061810892081523, "percentage": 2.53, "elapsed_time": "0:27:33", "remaining_time": "17:40:59", "throughput": 3347.95, "total_tokens": 5534176} +{"current_steps": 4550, "total_steps": 179580, "loss": 0.2959, "lr": 1.2665664327876157e-05, "epoch": 0.5067379440917696, "percentage": 2.53, "elapsed_time": "0:27:34", "remaining_time": "17:40:58", "throughput": 3347.92, "total_tokens": 5540256} +{"current_steps": 4555, "total_steps": 179580, "loss": 0.0806, "lr": 1.267958569996659e-05, "epoch": 0.507294798975387, "percentage": 2.54, "elapsed_time": "0:27:36", "remaining_time": "17:40:59", "throughput": 3347.9, "total_tokens": 5546528} +{"current_steps": 4560, "total_steps": 179580, "loss": 0.2245, "lr": 1.2693507072057024e-05, "epoch": 0.5078516538590043, "percentage": 2.54, "elapsed_time": "0:27:38", "remaining_time": "17:40:53", "throughput": 3347.87, "total_tokens": 5552224} +{"current_steps": 4565, "total_steps": 179580, "loss": 0.2021, "lr": 1.2707428444147457e-05, "epoch": 0.5084085087426217, "percentage": 2.54, "elapsed_time": "0:27:40", "remaining_time": "17:40:55", "throughput": 3347.95, "total_tokens": 5558752} +{"current_steps": 4570, "total_steps": 179580, "loss": 0.1603, "lr": 1.272134981623789e-05, "epoch": 0.508965363626239, "percentage": 2.54, "elapsed_time": "0:27:42", "remaining_time": "17:40:53", "throughput": 3347.93, "total_tokens": 5564800} +{"current_steps": 4575, "total_steps": 179580, "loss": 0.2824, "lr": 1.2735271188328322e-05, "epoch": 0.5095222185098564, "percentage": 2.55, "elapsed_time": "0:27:43", "remaining_time": "17:40:43", "throughput": 3347.89, "total_tokens": 5570144} +{"current_steps": 4580, "total_steps": 179580, "loss": 0.3118, "lr": 1.2749192560418754e-05, "epoch": 0.5100790733934737, "percentage": 2.55, "elapsed_time": "0:27:45", "remaining_time": "17:40:44", "throughput": 3347.84, "total_tokens": 5576352} +{"current_steps": 4585, "total_steps": 179580, "loss": 0.3781, "lr": 1.2763113932509189e-05, "epoch": 0.510635928277091, "percentage": 2.55, "elapsed_time": "0:27:47", "remaining_time": "17:40:41", "throughput": 3347.88, "total_tokens": 5582464} +{"current_steps": 4590, "total_steps": 179580, "loss": 0.2983, "lr": 1.2777035304599621e-05, "epoch": 0.5111927831607083, "percentage": 2.56, "elapsed_time": "0:27:49", "remaining_time": "17:40:42", "throughput": 3347.57, "total_tokens": 5588288} +{"current_steps": 4595, "total_steps": 179580, "loss": 0.2704, "lr": 1.2790956676690056e-05, "epoch": 0.5117496380443256, "percentage": 2.56, "elapsed_time": "0:27:51", "remaining_time": "17:40:44", "throughput": 3347.62, "total_tokens": 5594752} +{"current_steps": 4600, "total_steps": 179580, "loss": 0.2528, "lr": 1.2804878048780488e-05, "epoch": 0.512306492927943, "percentage": 2.56, "elapsed_time": "0:27:53", "remaining_time": "17:40:45", "throughput": 3347.65, "total_tokens": 5601152} +{"current_steps": 4605, "total_steps": 179580, "loss": 0.2216, "lr": 1.2818799420870923e-05, "epoch": 0.5128633478115603, "percentage": 2.56, "elapsed_time": "0:27:54", "remaining_time": "17:40:44", "throughput": 3347.7, "total_tokens": 5607392} +{"current_steps": 4610, "total_steps": 179580, "loss": 0.2744, "lr": 1.2832720792961355e-05, "epoch": 0.5134202026951776, "percentage": 2.57, "elapsed_time": "0:27:56", "remaining_time": "17:40:43", "throughput": 3347.77, "total_tokens": 5613696} +{"current_steps": 4615, "total_steps": 179580, "loss": 0.2055, "lr": 1.284664216505179e-05, "epoch": 0.513977057578795, "percentage": 2.57, "elapsed_time": "0:27:58", "remaining_time": "17:40:42", "throughput": 3347.77, "total_tokens": 5619872} +{"current_steps": 4620, "total_steps": 179580, "loss": 0.0959, "lr": 1.286056353714222e-05, "epoch": 0.5145339124624123, "percentage": 2.57, "elapsed_time": "0:28:00", "remaining_time": "17:40:41", "throughput": 3347.78, "total_tokens": 5626048} +{"current_steps": 4625, "total_steps": 179580, "loss": 0.1693, "lr": 1.2874484909232653e-05, "epoch": 0.5150907673460297, "percentage": 2.58, "elapsed_time": "0:28:02", "remaining_time": "17:40:41", "throughput": 3347.76, "total_tokens": 5632224} +{"current_steps": 4630, "total_steps": 179580, "loss": 0.2768, "lr": 1.2888406281323088e-05, "epoch": 0.515647622229647, "percentage": 2.58, "elapsed_time": "0:28:04", "remaining_time": "17:40:35", "throughput": 3347.78, "total_tokens": 5638016} +{"current_steps": 4635, "total_steps": 179580, "loss": 0.5102, "lr": 1.290232765341352e-05, "epoch": 0.5162044771132643, "percentage": 2.58, "elapsed_time": "0:28:05", "remaining_time": "17:40:34", "throughput": 3347.78, "total_tokens": 5644160} +{"current_steps": 4640, "total_steps": 179580, "loss": 0.1287, "lr": 1.2916249025503954e-05, "epoch": 0.5167613319968816, "percentage": 2.58, "elapsed_time": "0:28:07", "remaining_time": "17:40:32", "throughput": 3347.81, "total_tokens": 5650272} +{"current_steps": 4645, "total_steps": 179580, "loss": 0.2107, "lr": 1.2930170397594387e-05, "epoch": 0.5173181868804989, "percentage": 2.59, "elapsed_time": "0:28:09", "remaining_time": "17:40:32", "throughput": 3347.83, "total_tokens": 5656576} +{"current_steps": 4650, "total_steps": 179580, "loss": 0.2563, "lr": 1.2944091769684821e-05, "epoch": 0.5178750417641163, "percentage": 2.59, "elapsed_time": "0:28:11", "remaining_time": "17:40:30", "throughput": 3347.81, "total_tokens": 5662592} +{"current_steps": 4655, "total_steps": 179580, "loss": 0.27, "lr": 1.2958013141775254e-05, "epoch": 0.5184318966477336, "percentage": 2.59, "elapsed_time": "0:28:13", "remaining_time": "17:40:29", "throughput": 3347.81, "total_tokens": 5668736} +{"current_steps": 4660, "total_steps": 179580, "loss": 0.1874, "lr": 1.2971934513865688e-05, "epoch": 0.5189887515313509, "percentage": 2.59, "elapsed_time": "0:28:15", "remaining_time": "17:40:28", "throughput": 3347.78, "total_tokens": 5674880} +{"current_steps": 4665, "total_steps": 179580, "loss": 0.2794, "lr": 1.298585588595612e-05, "epoch": 0.5195456064149683, "percentage": 2.6, "elapsed_time": "0:28:16", "remaining_time": "17:40:27", "throughput": 3347.78, "total_tokens": 5681056} +{"current_steps": 4670, "total_steps": 179580, "loss": 0.1578, "lr": 1.2999777258046552e-05, "epoch": 0.5201024612985856, "percentage": 2.6, "elapsed_time": "0:28:18", "remaining_time": "17:40:25", "throughput": 3347.79, "total_tokens": 5687136} +{"current_steps": 4675, "total_steps": 179580, "loss": 0.1269, "lr": 1.3013698630136986e-05, "epoch": 0.520659316182203, "percentage": 2.6, "elapsed_time": "0:28:20", "remaining_time": "17:40:23", "throughput": 3347.8, "total_tokens": 5693216} +{"current_steps": 4680, "total_steps": 179580, "loss": 0.1936, "lr": 1.3027620002227419e-05, "epoch": 0.5212161710658203, "percentage": 2.61, "elapsed_time": "0:28:22", "remaining_time": "17:40:21", "throughput": 3347.79, "total_tokens": 5699232} +{"current_steps": 4685, "total_steps": 179580, "loss": 0.3716, "lr": 1.3041541374317853e-05, "epoch": 0.5217730259494375, "percentage": 2.61, "elapsed_time": "0:28:24", "remaining_time": "17:40:19", "throughput": 3347.79, "total_tokens": 5705280} +{"current_steps": 4690, "total_steps": 179580, "loss": 0.222, "lr": 1.3055462746408288e-05, "epoch": 0.5223298808330549, "percentage": 2.61, "elapsed_time": "0:28:26", "remaining_time": "17:40:17", "throughput": 3347.8, "total_tokens": 5711456} +{"current_steps": 4695, "total_steps": 179580, "loss": 0.2699, "lr": 1.306938411849872e-05, "epoch": 0.5228867357166722, "percentage": 2.61, "elapsed_time": "0:28:27", "remaining_time": "17:40:15", "throughput": 3347.79, "total_tokens": 5717440} +{"current_steps": 4700, "total_steps": 179580, "loss": 0.1872, "lr": 1.3083305490589155e-05, "epoch": 0.5234435906002896, "percentage": 2.62, "elapsed_time": "0:28:29", "remaining_time": "17:40:12", "throughput": 3347.77, "total_tokens": 5723456} +{"current_steps": 4705, "total_steps": 179580, "loss": 0.1182, "lr": 1.3097226862679587e-05, "epoch": 0.5240004454839069, "percentage": 2.62, "elapsed_time": "0:28:31", "remaining_time": "17:40:12", "throughput": 3347.74, "total_tokens": 5729632} +{"current_steps": 4710, "total_steps": 179580, "loss": 0.3185, "lr": 1.3111148234770018e-05, "epoch": 0.5245573003675242, "percentage": 2.62, "elapsed_time": "0:28:33", "remaining_time": "17:40:13", "throughput": 3347.76, "total_tokens": 5736000} +{"current_steps": 4715, "total_steps": 179580, "loss": 0.1295, "lr": 1.3125069606860452e-05, "epoch": 0.5251141552511416, "percentage": 2.63, "elapsed_time": "0:28:35", "remaining_time": "17:40:10", "throughput": 3347.72, "total_tokens": 5741952} +{"current_steps": 4720, "total_steps": 179580, "loss": 0.288, "lr": 1.3138990978950885e-05, "epoch": 0.5256710101347589, "percentage": 2.63, "elapsed_time": "0:28:37", "remaining_time": "17:40:09", "throughput": 3347.75, "total_tokens": 5748160} +{"current_steps": 4725, "total_steps": 179580, "loss": 0.1955, "lr": 1.315291235104132e-05, "epoch": 0.5262278650183763, "percentage": 2.63, "elapsed_time": "0:28:38", "remaining_time": "17:40:07", "throughput": 3347.75, "total_tokens": 5754176} +{"current_steps": 4730, "total_steps": 179580, "loss": 0.1279, "lr": 1.3166833723131752e-05, "epoch": 0.5267847199019935, "percentage": 2.63, "elapsed_time": "0:28:40", "remaining_time": "17:40:05", "throughput": 3347.76, "total_tokens": 5760256} +{"current_steps": 4735, "total_steps": 179580, "loss": 0.122, "lr": 1.3180755095222186e-05, "epoch": 0.5273415747856108, "percentage": 2.64, "elapsed_time": "0:28:42", "remaining_time": "17:40:02", "throughput": 3347.81, "total_tokens": 5766336} +{"current_steps": 4740, "total_steps": 179580, "loss": 0.1014, "lr": 1.3194676467312619e-05, "epoch": 0.5278984296692282, "percentage": 2.64, "elapsed_time": "0:28:44", "remaining_time": "17:40:03", "throughput": 3347.8, "total_tokens": 5772736} +{"current_steps": 4745, "total_steps": 179580, "loss": 0.3115, "lr": 1.3208597839403053e-05, "epoch": 0.5284552845528455, "percentage": 2.64, "elapsed_time": "0:28:46", "remaining_time": "17:40:01", "throughput": 3347.8, "total_tokens": 5778784} +{"current_steps": 4750, "total_steps": 179580, "loss": 0.3534, "lr": 1.3222519211493486e-05, "epoch": 0.5290121394364629, "percentage": 2.65, "elapsed_time": "0:28:47", "remaining_time": "17:40:00", "throughput": 3347.82, "total_tokens": 5784992} +{"current_steps": 4755, "total_steps": 179580, "loss": 0.3354, "lr": 1.323644058358392e-05, "epoch": 0.5295689943200802, "percentage": 2.65, "elapsed_time": "0:28:49", "remaining_time": "17:39:58", "throughput": 3347.84, "total_tokens": 5791072} +{"current_steps": 4760, "total_steps": 179580, "loss": 0.118, "lr": 1.3250361955674351e-05, "epoch": 0.5301258492036975, "percentage": 2.65, "elapsed_time": "0:28:51", "remaining_time": "17:39:57", "throughput": 3347.85, "total_tokens": 5797248} +{"current_steps": 4765, "total_steps": 179580, "loss": 0.2154, "lr": 1.3264283327764784e-05, "epoch": 0.5306827040873149, "percentage": 2.65, "elapsed_time": "0:28:53", "remaining_time": "17:39:59", "throughput": 3347.85, "total_tokens": 5803648} +{"current_steps": 4770, "total_steps": 179580, "loss": 0.343, "lr": 1.3278204699855218e-05, "epoch": 0.5312395589709322, "percentage": 2.66, "elapsed_time": "0:28:55", "remaining_time": "17:39:57", "throughput": 3347.87, "total_tokens": 5809760} +{"current_steps": 4775, "total_steps": 179580, "loss": 0.4062, "lr": 1.3292126071945651e-05, "epoch": 0.5317964138545495, "percentage": 2.66, "elapsed_time": "0:28:57", "remaining_time": "17:39:54", "throughput": 3347.83, "total_tokens": 5815744} +{"current_steps": 4780, "total_steps": 179580, "loss": 0.1787, "lr": 1.3306047444036085e-05, "epoch": 0.5323532687381668, "percentage": 2.66, "elapsed_time": "0:28:59", "remaining_time": "17:39:54", "throughput": 3347.82, "total_tokens": 5821984} +{"current_steps": 4785, "total_steps": 179580, "loss": 0.1936, "lr": 1.3319968816126518e-05, "epoch": 0.5329101236217841, "percentage": 2.66, "elapsed_time": "0:29:00", "remaining_time": "17:39:52", "throughput": 3347.86, "total_tokens": 5828128} +{"current_steps": 4790, "total_steps": 179580, "loss": 0.309, "lr": 1.3333890188216952e-05, "epoch": 0.5334669785054015, "percentage": 2.67, "elapsed_time": "0:29:02", "remaining_time": "17:39:49", "throughput": 3347.84, "total_tokens": 5834016} +{"current_steps": 4795, "total_steps": 179580, "loss": 0.1421, "lr": 1.3347811560307385e-05, "epoch": 0.5340238333890188, "percentage": 2.67, "elapsed_time": "0:29:04", "remaining_time": "17:39:48", "throughput": 3347.88, "total_tokens": 5840256} +{"current_steps": 4800, "total_steps": 179580, "loss": 0.2883, "lr": 1.3361732932397819e-05, "epoch": 0.5345806882726362, "percentage": 2.67, "elapsed_time": "0:29:06", "remaining_time": "17:39:44", "throughput": 3347.88, "total_tokens": 5846112} +{"current_steps": 4805, "total_steps": 179580, "loss": 0.1884, "lr": 1.337565430448825e-05, "epoch": 0.5351375431562535, "percentage": 2.68, "elapsed_time": "0:29:07", "remaining_time": "17:39:40", "throughput": 3347.87, "total_tokens": 5852032} +{"current_steps": 4810, "total_steps": 179580, "loss": 0.225, "lr": 1.3389575676578683e-05, "epoch": 0.5356943980398708, "percentage": 2.68, "elapsed_time": "0:29:09", "remaining_time": "17:39:32", "throughput": 3347.8, "total_tokens": 5857408} +{"current_steps": 4815, "total_steps": 179580, "loss": 0.2627, "lr": 1.3403497048669117e-05, "epoch": 0.5362512529234882, "percentage": 2.68, "elapsed_time": "0:29:11", "remaining_time": "17:39:30", "throughput": 3347.82, "total_tokens": 5863584} +{"current_steps": 4820, "total_steps": 179580, "loss": 0.1871, "lr": 1.341741842075955e-05, "epoch": 0.5368081078071054, "percentage": 2.68, "elapsed_time": "0:29:13", "remaining_time": "17:39:29", "throughput": 3347.81, "total_tokens": 5869664} +{"current_steps": 4825, "total_steps": 179580, "loss": 0.2633, "lr": 1.3431339792849984e-05, "epoch": 0.5373649626907228, "percentage": 2.69, "elapsed_time": "0:29:15", "remaining_time": "17:39:28", "throughput": 3347.82, "total_tokens": 5875840} +{"current_steps": 4830, "total_steps": 179580, "loss": 0.2619, "lr": 1.3445261164940418e-05, "epoch": 0.5379218175743401, "percentage": 2.69, "elapsed_time": "0:29:16", "remaining_time": "17:39:27", "throughput": 3347.84, "total_tokens": 5882048} +{"current_steps": 4835, "total_steps": 179580, "loss": 0.1477, "lr": 1.3459182537030851e-05, "epoch": 0.5384786724579574, "percentage": 2.69, "elapsed_time": "0:29:18", "remaining_time": "17:39:26", "throughput": 3347.86, "total_tokens": 5888256} +{"current_steps": 4840, "total_steps": 179580, "loss": 0.2666, "lr": 1.3473103909121285e-05, "epoch": 0.5390355273415748, "percentage": 2.7, "elapsed_time": "0:29:20", "remaining_time": "17:39:25", "throughput": 3347.84, "total_tokens": 5894368} +{"current_steps": 4845, "total_steps": 179580, "loss": 0.1345, "lr": 1.3487025281211718e-05, "epoch": 0.5395923822251921, "percentage": 2.7, "elapsed_time": "0:29:22", "remaining_time": "17:39:19", "throughput": 3347.79, "total_tokens": 5900000} +{"current_steps": 4850, "total_steps": 179580, "loss": 0.1397, "lr": 1.3500946653302149e-05, "epoch": 0.5401492371088095, "percentage": 2.7, "elapsed_time": "0:29:24", "remaining_time": "17:39:17", "throughput": 3347.76, "total_tokens": 5906048} +{"current_steps": 4855, "total_steps": 179580, "loss": 0.1686, "lr": 1.3514868025392583e-05, "epoch": 0.5407060919924268, "percentage": 2.7, "elapsed_time": "0:29:26", "remaining_time": "17:39:18", "throughput": 3347.78, "total_tokens": 5912448} +{"current_steps": 4860, "total_steps": 179580, "loss": 0.1144, "lr": 1.3528789397483016e-05, "epoch": 0.5412629468760441, "percentage": 2.71, "elapsed_time": "0:29:27", "remaining_time": "17:39:18", "throughput": 3347.78, "total_tokens": 5918656} +{"current_steps": 4865, "total_steps": 179580, "loss": 0.2748, "lr": 1.354271076957345e-05, "epoch": 0.5418198017596614, "percentage": 2.71, "elapsed_time": "0:29:29", "remaining_time": "17:39:16", "throughput": 3347.74, "total_tokens": 5924672} +{"current_steps": 4870, "total_steps": 179580, "loss": 0.1148, "lr": 1.3556632141663883e-05, "epoch": 0.5423766566432787, "percentage": 2.71, "elapsed_time": "0:29:31", "remaining_time": "17:39:14", "throughput": 3347.73, "total_tokens": 5930688} +{"current_steps": 4875, "total_steps": 179580, "loss": 0.1322, "lr": 1.3570553513754317e-05, "epoch": 0.5429335115268961, "percentage": 2.71, "elapsed_time": "0:29:33", "remaining_time": "17:39:12", "throughput": 3347.72, "total_tokens": 5936800} +{"current_steps": 4880, "total_steps": 179580, "loss": 0.0587, "lr": 1.358447488584475e-05, "epoch": 0.5434903664105134, "percentage": 2.72, "elapsed_time": "0:29:35", "remaining_time": "17:39:12", "throughput": 3347.76, "total_tokens": 5943072} +{"current_steps": 4885, "total_steps": 179580, "loss": 0.2369, "lr": 1.3598396257935184e-05, "epoch": 0.5440472212941307, "percentage": 2.72, "elapsed_time": "0:29:37", "remaining_time": "17:39:11", "throughput": 3347.8, "total_tokens": 5949312} +{"current_steps": 4890, "total_steps": 179580, "loss": 0.1595, "lr": 1.3612317630025617e-05, "epoch": 0.5446040761777481, "percentage": 2.72, "elapsed_time": "0:29:38", "remaining_time": "17:39:11", "throughput": 3347.85, "total_tokens": 5955712} +{"current_steps": 4895, "total_steps": 179580, "loss": 0.422, "lr": 1.3626239002116048e-05, "epoch": 0.5451609310613654, "percentage": 2.73, "elapsed_time": "0:29:40", "remaining_time": "17:39:15", "throughput": 3347.89, "total_tokens": 5962432} +{"current_steps": 4900, "total_steps": 179580, "loss": 0.1874, "lr": 1.3640160374206482e-05, "epoch": 0.5457177859449828, "percentage": 2.73, "elapsed_time": "0:29:42", "remaining_time": "17:39:13", "throughput": 3347.88, "total_tokens": 5968416} +{"current_steps": 4905, "total_steps": 179580, "loss": 0.191, "lr": 1.3654081746296915e-05, "epoch": 0.5462746408286001, "percentage": 2.73, "elapsed_time": "0:29:44", "remaining_time": "17:39:14", "throughput": 3347.9, "total_tokens": 5974816} +{"current_steps": 4910, "total_steps": 179580, "loss": 0.2073, "lr": 1.3668003118387349e-05, "epoch": 0.5468314957122173, "percentage": 2.73, "elapsed_time": "0:29:46", "remaining_time": "17:39:11", "throughput": 3347.91, "total_tokens": 5980864} +{"current_steps": 4915, "total_steps": 179580, "loss": 0.2179, "lr": 1.3681924490477782e-05, "epoch": 0.5473883505958347, "percentage": 2.74, "elapsed_time": "0:29:48", "remaining_time": "17:39:02", "throughput": 3347.82, "total_tokens": 5986144} +{"current_steps": 4920, "total_steps": 179580, "loss": 0.0889, "lr": 1.3695845862568216e-05, "epoch": 0.547945205479452, "percentage": 2.74, "elapsed_time": "0:29:50", "remaining_time": "17:39:05", "throughput": 3347.85, "total_tokens": 5992672} +{"current_steps": 4925, "total_steps": 179580, "loss": 0.2517, "lr": 1.3709767234658649e-05, "epoch": 0.5485020603630694, "percentage": 2.74, "elapsed_time": "0:29:51", "remaining_time": "17:38:58", "throughput": 3347.78, "total_tokens": 5998176} +{"current_steps": 4930, "total_steps": 179580, "loss": 0.1874, "lr": 1.3723688606749083e-05, "epoch": 0.5490589152466867, "percentage": 2.75, "elapsed_time": "0:29:53", "remaining_time": "17:38:54", "throughput": 3347.79, "total_tokens": 6004064} +{"current_steps": 4935, "total_steps": 179580, "loss": 0.2527, "lr": 1.3737609978839515e-05, "epoch": 0.549615770130304, "percentage": 2.75, "elapsed_time": "0:29:55", "remaining_time": "17:38:56", "throughput": 3347.87, "total_tokens": 6010688} +{"current_steps": 4940, "total_steps": 179580, "loss": 0.214, "lr": 1.3751531350929946e-05, "epoch": 0.5501726250139214, "percentage": 2.75, "elapsed_time": "0:29:57", "remaining_time": "17:38:55", "throughput": 3347.89, "total_tokens": 6016896} +{"current_steps": 4945, "total_steps": 179580, "loss": 0.2896, "lr": 1.376545272302038e-05, "epoch": 0.5507294798975387, "percentage": 2.75, "elapsed_time": "0:29:58", "remaining_time": "17:38:52", "throughput": 3347.9, "total_tokens": 6022848} +{"current_steps": 4950, "total_steps": 179580, "loss": 0.2286, "lr": 1.3779374095110813e-05, "epoch": 0.5512863347811561, "percentage": 2.76, "elapsed_time": "0:30:00", "remaining_time": "17:38:52", "throughput": 3347.95, "total_tokens": 6029216} +{"current_steps": 4955, "total_steps": 179580, "loss": 0.115, "lr": 1.3793295467201248e-05, "epoch": 0.5518431896647734, "percentage": 2.76, "elapsed_time": "0:30:02", "remaining_time": "17:38:51", "throughput": 3347.94, "total_tokens": 6035360} +{"current_steps": 4960, "total_steps": 179580, "loss": 0.1743, "lr": 1.380721683929168e-05, "epoch": 0.5524000445483906, "percentage": 2.76, "elapsed_time": "0:30:04", "remaining_time": "17:38:51", "throughput": 3347.95, "total_tokens": 6041632} +{"current_steps": 4965, "total_steps": 179580, "loss": 0.1619, "lr": 1.3821138211382115e-05, "epoch": 0.552956899432008, "percentage": 2.76, "elapsed_time": "0:30:06", "remaining_time": "17:38:48", "throughput": 3347.97, "total_tokens": 6047712} +{"current_steps": 4970, "total_steps": 179580, "loss": 0.2399, "lr": 1.3835059583472549e-05, "epoch": 0.5535137543156253, "percentage": 2.77, "elapsed_time": "0:30:08", "remaining_time": "17:38:47", "throughput": 3347.96, "total_tokens": 6053792} +{"current_steps": 4975, "total_steps": 179580, "loss": 0.1381, "lr": 1.3848980955562982e-05, "epoch": 0.5540706091992427, "percentage": 2.77, "elapsed_time": "0:30:10", "remaining_time": "17:38:45", "throughput": 3347.96, "total_tokens": 6059904} +{"current_steps": 4980, "total_steps": 179580, "loss": 0.1904, "lr": 1.3862902327653416e-05, "epoch": 0.55462746408286, "percentage": 2.77, "elapsed_time": "0:30:11", "remaining_time": "17:38:47", "throughput": 3347.98, "total_tokens": 6066336} +{"current_steps": 4985, "total_steps": 179580, "loss": 0.0776, "lr": 1.3876823699743847e-05, "epoch": 0.5551843189664774, "percentage": 2.78, "elapsed_time": "0:30:13", "remaining_time": "17:38:45", "throughput": 3347.97, "total_tokens": 6072448} +{"current_steps": 4990, "total_steps": 179580, "loss": 0.1895, "lr": 1.389074507183428e-05, "epoch": 0.5557411738500947, "percentage": 2.78, "elapsed_time": "0:30:15", "remaining_time": "17:38:43", "throughput": 3347.95, "total_tokens": 6078464} +{"current_steps": 4995, "total_steps": 179580, "loss": 0.5285, "lr": 1.3904666443924714e-05, "epoch": 0.556298028733712, "percentage": 2.78, "elapsed_time": "0:30:17", "remaining_time": "17:38:40", "throughput": 3347.94, "total_tokens": 6084480} +{"current_steps": 5000, "total_steps": 179580, "loss": 0.4259, "lr": 1.3918587816015147e-05, "epoch": 0.5568548836173294, "percentage": 2.78, "elapsed_time": "0:30:19", "remaining_time": "17:38:40", "throughput": 3347.97, "total_tokens": 6090784} +{"current_steps": 5005, "total_steps": 179580, "loss": 0.4717, "lr": 1.3932509188105581e-05, "epoch": 0.5574117385009466, "percentage": 2.79, "elapsed_time": "0:30:20", "remaining_time": "17:38:36", "throughput": 3347.96, "total_tokens": 6096608} +{"current_steps": 5010, "total_steps": 179580, "loss": 0.2554, "lr": 1.3946430560196013e-05, "epoch": 0.557968593384564, "percentage": 2.79, "elapsed_time": "0:30:22", "remaining_time": "17:38:35", "throughput": 3347.94, "total_tokens": 6102784} +{"current_steps": 5015, "total_steps": 179580, "loss": 0.3093, "lr": 1.3960351932286448e-05, "epoch": 0.5585254482681813, "percentage": 2.79, "elapsed_time": "0:30:24", "remaining_time": "17:38:33", "throughput": 3347.99, "total_tokens": 6108864} +{"current_steps": 5020, "total_steps": 179580, "loss": 0.1669, "lr": 1.397427330437688e-05, "epoch": 0.5590823031517986, "percentage": 2.8, "elapsed_time": "0:30:26", "remaining_time": "17:38:30", "throughput": 3347.96, "total_tokens": 6114848} +{"current_steps": 5025, "total_steps": 179580, "loss": 0.1761, "lr": 1.3988194676467315e-05, "epoch": 0.559639158035416, "percentage": 2.8, "elapsed_time": "0:30:28", "remaining_time": "17:38:29", "throughput": 3347.96, "total_tokens": 6120992} +{"current_steps": 5030, "total_steps": 179580, "loss": 0.1655, "lr": 1.4002116048557746e-05, "epoch": 0.5601960129190333, "percentage": 2.8, "elapsed_time": "0:30:29", "remaining_time": "17:38:21", "throughput": 3347.94, "total_tokens": 6126432} +{"current_steps": 5035, "total_steps": 179580, "loss": 0.2022, "lr": 1.4016037420648178e-05, "epoch": 0.5607528678026507, "percentage": 2.8, "elapsed_time": "0:30:31", "remaining_time": "17:38:19", "throughput": 3347.91, "total_tokens": 6132512} +{"current_steps": 5040, "total_steps": 179580, "loss": 0.0552, "lr": 1.4029958792738613e-05, "epoch": 0.561309722686268, "percentage": 2.81, "elapsed_time": "0:30:33", "remaining_time": "17:38:17", "throughput": 3347.87, "total_tokens": 6138464} +{"current_steps": 5045, "total_steps": 179580, "loss": 0.2645, "lr": 1.4043880164829045e-05, "epoch": 0.5618665775698853, "percentage": 2.81, "elapsed_time": "0:30:35", "remaining_time": "17:38:19", "throughput": 3347.81, "total_tokens": 6144800} +{"current_steps": 5050, "total_steps": 179580, "loss": 0.3082, "lr": 1.405780153691948e-05, "epoch": 0.5624234324535026, "percentage": 2.81, "elapsed_time": "0:30:37", "remaining_time": "17:38:17", "throughput": 3347.79, "total_tokens": 6150880} +{"current_steps": 5055, "total_steps": 179580, "loss": 0.2837, "lr": 1.4071722909009912e-05, "epoch": 0.5629802873371199, "percentage": 2.81, "elapsed_time": "0:30:39", "remaining_time": "17:38:14", "throughput": 3347.76, "total_tokens": 6156832} +{"current_steps": 5060, "total_steps": 179580, "loss": 0.1771, "lr": 1.4085644281100347e-05, "epoch": 0.5635371422207373, "percentage": 2.82, "elapsed_time": "0:30:40", "remaining_time": "17:38:11", "throughput": 3347.74, "total_tokens": 6162720} +{"current_steps": 5065, "total_steps": 179580, "loss": 0.5084, "lr": 1.409956565319078e-05, "epoch": 0.5640939971043546, "percentage": 2.82, "elapsed_time": "0:30:42", "remaining_time": "17:38:08", "throughput": 3347.73, "total_tokens": 6168640} +{"current_steps": 5070, "total_steps": 179580, "loss": 0.2277, "lr": 1.4113487025281214e-05, "epoch": 0.5646508519879719, "percentage": 2.82, "elapsed_time": "0:30:44", "remaining_time": "17:38:06", "throughput": 3347.77, "total_tokens": 6174816} +{"current_steps": 5075, "total_steps": 179580, "loss": 0.3782, "lr": 1.4127408397371646e-05, "epoch": 0.5652077068715893, "percentage": 2.83, "elapsed_time": "0:30:46", "remaining_time": "17:38:01", "throughput": 3347.71, "total_tokens": 6180448} +{"current_steps": 5080, "total_steps": 179580, "loss": 0.3557, "lr": 1.4141329769462077e-05, "epoch": 0.5657645617552066, "percentage": 2.83, "elapsed_time": "0:30:47", "remaining_time": "17:37:58", "throughput": 3347.65, "total_tokens": 6186336} +{"current_steps": 5085, "total_steps": 179580, "loss": 0.2869, "lr": 1.4155251141552511e-05, "epoch": 0.566321416638824, "percentage": 2.83, "elapsed_time": "0:30:49", "remaining_time": "17:37:54", "throughput": 3347.65, "total_tokens": 6192256} +{"current_steps": 5090, "total_steps": 179580, "loss": 0.1907, "lr": 1.4169172513642944e-05, "epoch": 0.5668782715224413, "percentage": 2.83, "elapsed_time": "0:30:51", "remaining_time": "17:37:45", "throughput": 3347.62, "total_tokens": 6197600} +{"current_steps": 5095, "total_steps": 179580, "loss": 0.099, "lr": 1.4183093885733378e-05, "epoch": 0.5674351264060585, "percentage": 2.84, "elapsed_time": "0:30:53", "remaining_time": "17:37:44", "throughput": 3347.63, "total_tokens": 6203776} +{"current_steps": 5100, "total_steps": 179580, "loss": 0.4431, "lr": 1.4197015257823813e-05, "epoch": 0.5679919812896759, "percentage": 2.84, "elapsed_time": "0:30:54", "remaining_time": "17:37:37", "throughput": 3347.65, "total_tokens": 6209408} +{"current_steps": 5105, "total_steps": 179580, "loss": 0.1079, "lr": 1.4210936629914245e-05, "epoch": 0.5685488361732932, "percentage": 2.84, "elapsed_time": "0:30:56", "remaining_time": "17:37:34", "throughput": 3347.65, "total_tokens": 6215360} +{"current_steps": 5110, "total_steps": 179580, "loss": 0.3418, "lr": 1.422485800200468e-05, "epoch": 0.5691056910569106, "percentage": 2.85, "elapsed_time": "0:30:58", "remaining_time": "17:37:27", "throughput": 3347.65, "total_tokens": 6220960} +{"current_steps": 5115, "total_steps": 179580, "loss": 0.2479, "lr": 1.4238779374095112e-05, "epoch": 0.5696625459405279, "percentage": 2.85, "elapsed_time": "0:31:00", "remaining_time": "17:37:26", "throughput": 3347.67, "total_tokens": 6227168} +{"current_steps": 5120, "total_steps": 179580, "loss": 0.3591, "lr": 1.4252700746185547e-05, "epoch": 0.5702194008241452, "percentage": 2.85, "elapsed_time": "0:31:01", "remaining_time": "17:37:23", "throughput": 3347.63, "total_tokens": 6233024} +{"current_steps": 5125, "total_steps": 179580, "loss": 0.0983, "lr": 1.4266622118275978e-05, "epoch": 0.5707762557077626, "percentage": 2.85, "elapsed_time": "0:31:03", "remaining_time": "17:37:19", "throughput": 3347.63, "total_tokens": 6238880} +{"current_steps": 5130, "total_steps": 179580, "loss": 0.2874, "lr": 1.428054349036641e-05, "epoch": 0.5713331105913799, "percentage": 2.86, "elapsed_time": "0:31:05", "remaining_time": "17:37:18", "throughput": 3347.65, "total_tokens": 6245056} +{"current_steps": 5135, "total_steps": 179580, "loss": 0.0548, "lr": 1.4294464862456845e-05, "epoch": 0.5718899654749973, "percentage": 2.86, "elapsed_time": "0:31:07", "remaining_time": "17:37:19", "throughput": 3347.69, "total_tokens": 6251520} +{"current_steps": 5140, "total_steps": 179580, "loss": 0.2952, "lr": 1.4308386234547277e-05, "epoch": 0.5724468203586145, "percentage": 2.86, "elapsed_time": "0:31:09", "remaining_time": "17:37:17", "throughput": 3347.72, "total_tokens": 6257632} +{"current_steps": 5145, "total_steps": 179580, "loss": 0.2333, "lr": 1.4322307606637712e-05, "epoch": 0.5730036752422318, "percentage": 2.87, "elapsed_time": "0:31:11", "remaining_time": "17:37:16", "throughput": 3347.74, "total_tokens": 6263904} +{"current_steps": 5150, "total_steps": 179580, "loss": 0.2228, "lr": 1.4336228978728144e-05, "epoch": 0.5735605301258492, "percentage": 2.87, "elapsed_time": "0:31:12", "remaining_time": "17:37:12", "throughput": 3347.71, "total_tokens": 6269728} +{"current_steps": 5155, "total_steps": 179580, "loss": 0.1578, "lr": 1.4350150350818579e-05, "epoch": 0.5741173850094665, "percentage": 2.87, "elapsed_time": "0:31:14", "remaining_time": "17:37:11", "throughput": 3347.67, "total_tokens": 6275744} +{"current_steps": 5160, "total_steps": 179580, "loss": 0.0987, "lr": 1.4364071722909011e-05, "epoch": 0.5746742398930839, "percentage": 2.87, "elapsed_time": "0:31:16", "remaining_time": "17:37:08", "throughput": 3347.65, "total_tokens": 6281696} +{"current_steps": 5165, "total_steps": 179580, "loss": 0.3018, "lr": 1.4377993094999445e-05, "epoch": 0.5752310947767012, "percentage": 2.88, "elapsed_time": "0:31:18", "remaining_time": "17:37:07", "throughput": 3347.65, "total_tokens": 6287840} +{"current_steps": 5170, "total_steps": 179580, "loss": 0.1505, "lr": 1.4391914467089876e-05, "epoch": 0.5757879496603185, "percentage": 2.88, "elapsed_time": "0:31:19", "remaining_time": "17:37:01", "throughput": 3347.61, "total_tokens": 6293472} +{"current_steps": 5175, "total_steps": 179580, "loss": 0.2122, "lr": 1.4405835839180309e-05, "epoch": 0.5763448045439359, "percentage": 2.88, "elapsed_time": "0:31:21", "remaining_time": "17:36:59", "throughput": 3347.59, "total_tokens": 6299456} +{"current_steps": 5180, "total_steps": 179580, "loss": 0.1378, "lr": 1.4419757211270743e-05, "epoch": 0.5769016594275532, "percentage": 2.88, "elapsed_time": "0:31:23", "remaining_time": "17:36:56", "throughput": 3347.58, "total_tokens": 6305472} +{"current_steps": 5185, "total_steps": 179580, "loss": 0.2175, "lr": 1.4433678583361176e-05, "epoch": 0.5774585143111705, "percentage": 2.89, "elapsed_time": "0:31:25", "remaining_time": "17:36:55", "throughput": 3347.58, "total_tokens": 6311616} +{"current_steps": 5190, "total_steps": 179580, "loss": 0.3394, "lr": 1.444759995545161e-05, "epoch": 0.5780153691947878, "percentage": 2.89, "elapsed_time": "0:31:27", "remaining_time": "17:36:53", "throughput": 3347.63, "total_tokens": 6317760} +{"current_steps": 5195, "total_steps": 179580, "loss": 0.4676, "lr": 1.4461521327542043e-05, "epoch": 0.5785722240784051, "percentage": 2.89, "elapsed_time": "0:31:29", "remaining_time": "17:36:52", "throughput": 3347.64, "total_tokens": 6324032} +{"current_steps": 5200, "total_steps": 179580, "loss": 0.3574, "lr": 1.4475442699632477e-05, "epoch": 0.5791290789620225, "percentage": 2.9, "elapsed_time": "0:31:30", "remaining_time": "17:36:50", "throughput": 3347.69, "total_tokens": 6330176} +{"current_steps": 5205, "total_steps": 179580, "loss": 0.2399, "lr": 1.448936407172291e-05, "epoch": 0.5796859338456398, "percentage": 2.9, "elapsed_time": "0:31:32", "remaining_time": "17:36:46", "throughput": 3347.69, "total_tokens": 6336000} +{"current_steps": 5210, "total_steps": 179580, "loss": 0.2099, "lr": 1.4503285443813344e-05, "epoch": 0.5802427887292572, "percentage": 2.9, "elapsed_time": "0:31:34", "remaining_time": "17:36:39", "throughput": 3347.68, "total_tokens": 6341536} +{"current_steps": 5215, "total_steps": 179580, "loss": 0.311, "lr": 1.4517206815903775e-05, "epoch": 0.5807996436128745, "percentage": 2.9, "elapsed_time": "0:31:36", "remaining_time": "17:36:33", "throughput": 3347.64, "total_tokens": 6347136} +{"current_steps": 5220, "total_steps": 179580, "loss": 0.2362, "lr": 1.4531128187994208e-05, "epoch": 0.5813564984964918, "percentage": 2.91, "elapsed_time": "0:31:37", "remaining_time": "17:36:28", "throughput": 3347.57, "total_tokens": 6352736} +{"current_steps": 5225, "total_steps": 179580, "loss": 0.1379, "lr": 1.4545049560084642e-05, "epoch": 0.5819133533801092, "percentage": 2.91, "elapsed_time": "0:31:39", "remaining_time": "17:36:27", "throughput": 3347.54, "total_tokens": 6358912} +{"current_steps": 5230, "total_steps": 179580, "loss": 0.1348, "lr": 1.4558970932175075e-05, "epoch": 0.5824702082637264, "percentage": 2.91, "elapsed_time": "0:31:41", "remaining_time": "17:36:24", "throughput": 3347.56, "total_tokens": 6364928} +{"current_steps": 5235, "total_steps": 179580, "loss": 0.1541, "lr": 1.4572892304265509e-05, "epoch": 0.5830270631473438, "percentage": 2.92, "elapsed_time": "0:31:43", "remaining_time": "17:36:21", "throughput": 3347.57, "total_tokens": 6370912} +{"current_steps": 5240, "total_steps": 179580, "loss": 0.1596, "lr": 1.4586813676355943e-05, "epoch": 0.5835839180309611, "percentage": 2.92, "elapsed_time": "0:31:44", "remaining_time": "17:36:20", "throughput": 3347.59, "total_tokens": 6377088} +{"current_steps": 5245, "total_steps": 179580, "loss": 0.1164, "lr": 1.4600735048446376e-05, "epoch": 0.5841407729145784, "percentage": 2.92, "elapsed_time": "0:31:46", "remaining_time": "17:36:18", "throughput": 3347.58, "total_tokens": 6383104} +{"current_steps": 5250, "total_steps": 179580, "loss": 0.1416, "lr": 1.461465642053681e-05, "epoch": 0.5846976277981958, "percentage": 2.92, "elapsed_time": "0:31:48", "remaining_time": "17:36:19", "throughput": 3347.58, "total_tokens": 6389504} +{"current_steps": 5255, "total_steps": 179580, "loss": 0.3934, "lr": 1.4628577792627243e-05, "epoch": 0.5852544826818131, "percentage": 2.93, "elapsed_time": "0:31:50", "remaining_time": "17:36:17", "throughput": 3347.57, "total_tokens": 6395552} +{"current_steps": 5260, "total_steps": 179580, "loss": 0.3132, "lr": 1.4642499164717674e-05, "epoch": 0.5858113375654305, "percentage": 2.93, "elapsed_time": "0:31:52", "remaining_time": "17:36:17", "throughput": 3347.59, "total_tokens": 6401856} +{"current_steps": 5265, "total_steps": 179580, "loss": 0.3303, "lr": 1.4656420536808108e-05, "epoch": 0.5863681924490478, "percentage": 2.93, "elapsed_time": "0:31:54", "remaining_time": "17:36:14", "throughput": 3347.6, "total_tokens": 6407840} +{"current_steps": 5270, "total_steps": 179580, "loss": 0.1314, "lr": 1.4670341908898541e-05, "epoch": 0.5869250473326652, "percentage": 2.93, "elapsed_time": "0:31:55", "remaining_time": "17:36:13", "throughput": 3347.58, "total_tokens": 6413920} +{"current_steps": 5275, "total_steps": 179580, "loss": 0.2552, "lr": 1.4684263280988975e-05, "epoch": 0.5874819022162825, "percentage": 2.94, "elapsed_time": "0:31:57", "remaining_time": "17:36:10", "throughput": 3347.53, "total_tokens": 6419872} +{"current_steps": 5280, "total_steps": 179580, "loss": 0.1864, "lr": 1.4698184653079408e-05, "epoch": 0.5880387570998997, "percentage": 2.94, "elapsed_time": "0:31:59", "remaining_time": "17:36:04", "throughput": 3347.53, "total_tokens": 6425472} +{"current_steps": 5285, "total_steps": 179580, "loss": 0.2364, "lr": 1.4712106025169842e-05, "epoch": 0.5885956119835171, "percentage": 2.94, "elapsed_time": "0:32:01", "remaining_time": "17:36:03", "throughput": 3347.52, "total_tokens": 6431680} +{"current_steps": 5290, "total_steps": 179580, "loss": 0.3065, "lr": 1.4726027397260275e-05, "epoch": 0.5891524668671344, "percentage": 2.95, "elapsed_time": "0:32:03", "remaining_time": "17:36:02", "throughput": 3347.52, "total_tokens": 6437824} +{"current_steps": 5295, "total_steps": 179580, "loss": 0.2259, "lr": 1.473994876935071e-05, "epoch": 0.5897093217507517, "percentage": 2.95, "elapsed_time": "0:32:05", "remaining_time": "17:36:02", "throughput": 3347.53, "total_tokens": 6444096} +{"current_steps": 5300, "total_steps": 179580, "loss": 0.083, "lr": 1.4753870141441142e-05, "epoch": 0.5902661766343691, "percentage": 2.95, "elapsed_time": "0:32:06", "remaining_time": "17:36:00", "throughput": 3347.52, "total_tokens": 6450176} +{"current_steps": 5305, "total_steps": 179580, "loss": 0.1776, "lr": 1.4767791513531573e-05, "epoch": 0.5908230315179864, "percentage": 2.95, "elapsed_time": "0:32:08", "remaining_time": "17:35:54", "throughput": 3347.49, "total_tokens": 6455712} +{"current_steps": 5310, "total_steps": 179580, "loss": 0.2819, "lr": 1.4781712885622007e-05, "epoch": 0.5913798864016038, "percentage": 2.96, "elapsed_time": "0:32:10", "remaining_time": "17:35:51", "throughput": 3347.5, "total_tokens": 6461696} +{"current_steps": 5315, "total_steps": 179580, "loss": 0.2434, "lr": 1.479563425771244e-05, "epoch": 0.5919367412852211, "percentage": 2.96, "elapsed_time": "0:32:12", "remaining_time": "17:35:45", "throughput": 3347.47, "total_tokens": 6467328} +{"current_steps": 5320, "total_steps": 179580, "loss": 0.3102, "lr": 1.4809555629802874e-05, "epoch": 0.5924935961688385, "percentage": 2.96, "elapsed_time": "0:32:13", "remaining_time": "17:35:46", "throughput": 3347.49, "total_tokens": 6473696} +{"current_steps": 5325, "total_steps": 179580, "loss": 0.1395, "lr": 1.4823477001893307e-05, "epoch": 0.5930504510524557, "percentage": 2.97, "elapsed_time": "0:32:15", "remaining_time": "17:35:45", "throughput": 3347.54, "total_tokens": 6480000} +{"current_steps": 5330, "total_steps": 179580, "loss": 0.2183, "lr": 1.4837398373983741e-05, "epoch": 0.593607305936073, "percentage": 2.97, "elapsed_time": "0:32:17", "remaining_time": "17:35:41", "throughput": 3347.47, "total_tokens": 6485696} +{"current_steps": 5335, "total_steps": 179580, "loss": 0.277, "lr": 1.4851319746074174e-05, "epoch": 0.5941641608196904, "percentage": 2.97, "elapsed_time": "0:32:19", "remaining_time": "17:35:38", "throughput": 3347.45, "total_tokens": 6491616} +{"current_steps": 5340, "total_steps": 179580, "loss": 0.1561, "lr": 1.4865241118164608e-05, "epoch": 0.5947210157033077, "percentage": 2.97, "elapsed_time": "0:32:21", "remaining_time": "17:35:36", "throughput": 3347.47, "total_tokens": 6497728} +{"current_steps": 5345, "total_steps": 179580, "loss": 0.1769, "lr": 1.487916249025504e-05, "epoch": 0.595277870586925, "percentage": 2.98, "elapsed_time": "0:32:22", "remaining_time": "17:35:36", "throughput": 3347.47, "total_tokens": 6504064} +{"current_steps": 5350, "total_steps": 179580, "loss": 0.3347, "lr": 1.4893083862345472e-05, "epoch": 0.5958347254705424, "percentage": 2.98, "elapsed_time": "0:32:24", "remaining_time": "17:35:33", "throughput": 3347.45, "total_tokens": 6509952} +{"current_steps": 5355, "total_steps": 179580, "loss": 0.3109, "lr": 1.4907005234435906e-05, "epoch": 0.5963915803541597, "percentage": 2.98, "elapsed_time": "0:32:26", "remaining_time": "17:35:31", "throughput": 3347.44, "total_tokens": 6515968} +{"current_steps": 5360, "total_steps": 179580, "loss": 0.1169, "lr": 1.4920926606526339e-05, "epoch": 0.5969484352377771, "percentage": 2.98, "elapsed_time": "0:32:28", "remaining_time": "17:35:26", "throughput": 3347.4, "total_tokens": 6521664} +{"current_steps": 5365, "total_steps": 179580, "loss": 0.2429, "lr": 1.4934847978616773e-05, "epoch": 0.5975052901213944, "percentage": 2.99, "elapsed_time": "0:32:30", "remaining_time": "17:35:26", "throughput": 3347.45, "total_tokens": 6528032} +{"current_steps": 5370, "total_steps": 179580, "loss": 0.1402, "lr": 1.4948769350707206e-05, "epoch": 0.5980621450050116, "percentage": 2.99, "elapsed_time": "0:32:31", "remaining_time": "17:35:25", "throughput": 3347.46, "total_tokens": 6534208} +{"current_steps": 5375, "total_steps": 179580, "loss": 0.1212, "lr": 1.496269072279764e-05, "epoch": 0.598618999888629, "percentage": 2.99, "elapsed_time": "0:32:33", "remaining_time": "17:35:26", "throughput": 3347.47, "total_tokens": 6540672} +{"current_steps": 5380, "total_steps": 179580, "loss": 0.4075, "lr": 1.4976612094888074e-05, "epoch": 0.5991758547722463, "percentage": 3.0, "elapsed_time": "0:32:35", "remaining_time": "17:35:25", "throughput": 3347.48, "total_tokens": 6546784} +{"current_steps": 5385, "total_steps": 179580, "loss": 0.2873, "lr": 1.4990533466978507e-05, "epoch": 0.5997327096558637, "percentage": 3.0, "elapsed_time": "0:32:37", "remaining_time": "17:35:26", "throughput": 3347.49, "total_tokens": 6553248} +{"current_steps": 5390, "total_steps": 179580, "loss": 0.1493, "lr": 1.5004454839068941e-05, "epoch": 0.600289564539481, "percentage": 3.0, "elapsed_time": "0:32:39", "remaining_time": "17:35:25", "throughput": 3347.48, "total_tokens": 6559360} +{"current_steps": 5395, "total_steps": 179580, "loss": 0.1452, "lr": 1.501837621115937e-05, "epoch": 0.6008464194230984, "percentage": 3.0, "elapsed_time": "0:32:41", "remaining_time": "17:35:22", "throughput": 3347.48, "total_tokens": 6565312} +{"current_steps": 5400, "total_steps": 179580, "loss": 0.1445, "lr": 1.5032297583249805e-05, "epoch": 0.6014032743067157, "percentage": 3.01, "elapsed_time": "0:32:43", "remaining_time": "17:35:20", "throughput": 3347.45, "total_tokens": 6571328} +{"current_steps": 5405, "total_steps": 179580, "loss": 0.3237, "lr": 1.5046218955340239e-05, "epoch": 0.601960129190333, "percentage": 3.01, "elapsed_time": "0:32:44", "remaining_time": "17:35:17", "throughput": 3347.4, "total_tokens": 6577248} +{"current_steps": 5410, "total_steps": 179580, "loss": 0.1747, "lr": 1.5060140327430672e-05, "epoch": 0.6025169840739504, "percentage": 3.01, "elapsed_time": "0:32:46", "remaining_time": "17:35:18", "throughput": 3347.42, "total_tokens": 6583648} +{"current_steps": 5415, "total_steps": 179580, "loss": 0.1716, "lr": 1.5074061699521106e-05, "epoch": 0.6030738389575676, "percentage": 3.02, "elapsed_time": "0:32:48", "remaining_time": "17:35:14", "throughput": 3347.42, "total_tokens": 6589504} +{"current_steps": 5420, "total_steps": 179580, "loss": 0.2437, "lr": 1.5087983071611539e-05, "epoch": 0.603630693841185, "percentage": 3.02, "elapsed_time": "0:32:50", "remaining_time": "17:35:14", "throughput": 3347.46, "total_tokens": 6595776} +{"current_steps": 5425, "total_steps": 179580, "loss": 0.1971, "lr": 1.5101904443701973e-05, "epoch": 0.6041875487248023, "percentage": 3.02, "elapsed_time": "0:32:52", "remaining_time": "17:35:11", "throughput": 3347.49, "total_tokens": 6601856} +{"current_steps": 5430, "total_steps": 179580, "loss": 0.4618, "lr": 1.5115825815792406e-05, "epoch": 0.6047444036084196, "percentage": 3.02, "elapsed_time": "0:32:53", "remaining_time": "17:35:04", "throughput": 3347.44, "total_tokens": 6607328} +{"current_steps": 5435, "total_steps": 179580, "loss": 0.294, "lr": 1.512974718788284e-05, "epoch": 0.605301258492037, "percentage": 3.03, "elapsed_time": "0:32:55", "remaining_time": "17:35:02", "throughput": 3347.43, "total_tokens": 6613344} +{"current_steps": 5440, "total_steps": 179580, "loss": 0.1533, "lr": 1.5143668559973273e-05, "epoch": 0.6058581133756543, "percentage": 3.03, "elapsed_time": "0:32:57", "remaining_time": "17:35:02", "throughput": 3347.42, "total_tokens": 6619552} +{"current_steps": 5445, "total_steps": 179580, "loss": 0.3468, "lr": 1.5157589932063703e-05, "epoch": 0.6064149682592717, "percentage": 3.03, "elapsed_time": "0:32:59", "remaining_time": "17:34:55", "throughput": 3347.37, "total_tokens": 6625024} +{"current_steps": 5450, "total_steps": 179580, "loss": 0.1379, "lr": 1.5171511304154138e-05, "epoch": 0.606971823142889, "percentage": 3.03, "elapsed_time": "0:33:01", "remaining_time": "17:34:54", "throughput": 3347.41, "total_tokens": 6631232} +{"current_steps": 5455, "total_steps": 179580, "loss": 0.2837, "lr": 1.518543267624457e-05, "epoch": 0.6075286780265063, "percentage": 3.04, "elapsed_time": "0:33:02", "remaining_time": "17:34:53", "throughput": 3347.41, "total_tokens": 6637408} +{"current_steps": 5460, "total_steps": 179580, "loss": 0.3118, "lr": 1.5199354048335005e-05, "epoch": 0.6080855329101236, "percentage": 3.04, "elapsed_time": "0:33:04", "remaining_time": "17:34:51", "throughput": 3347.44, "total_tokens": 6643552} +{"current_steps": 5465, "total_steps": 179580, "loss": 0.2986, "lr": 1.5213275420425437e-05, "epoch": 0.6086423877937409, "percentage": 3.04, "elapsed_time": "0:33:06", "remaining_time": "17:34:50", "throughput": 3347.45, "total_tokens": 6649728} +{"current_steps": 5470, "total_steps": 179580, "loss": 0.2747, "lr": 1.5227196792515872e-05, "epoch": 0.6091992426773583, "percentage": 3.05, "elapsed_time": "0:33:08", "remaining_time": "17:34:47", "throughput": 3347.42, "total_tokens": 6655680} +{"current_steps": 5475, "total_steps": 179580, "loss": 0.2696, "lr": 1.5241118164606304e-05, "epoch": 0.6097560975609756, "percentage": 3.05, "elapsed_time": "0:33:10", "remaining_time": "17:34:44", "throughput": 3347.42, "total_tokens": 6661664} +{"current_steps": 5480, "total_steps": 179580, "loss": 0.1454, "lr": 1.5255039536696739e-05, "epoch": 0.6103129524445929, "percentage": 3.05, "elapsed_time": "0:33:11", "remaining_time": "17:34:44", "throughput": 3347.47, "total_tokens": 6667968} +{"current_steps": 5485, "total_steps": 179580, "loss": 0.2302, "lr": 1.526896090878717e-05, "epoch": 0.6108698073282103, "percentage": 3.05, "elapsed_time": "0:33:13", "remaining_time": "17:34:42", "throughput": 3347.45, "total_tokens": 6674016} +{"current_steps": 5490, "total_steps": 179580, "loss": 0.3052, "lr": 1.5282882280877602e-05, "epoch": 0.6114266622118276, "percentage": 3.06, "elapsed_time": "0:33:15", "remaining_time": "17:34:41", "throughput": 3347.45, "total_tokens": 6680192} +{"current_steps": 5495, "total_steps": 179580, "loss": 0.1958, "lr": 1.5296803652968037e-05, "epoch": 0.611983517095445, "percentage": 3.06, "elapsed_time": "0:33:17", "remaining_time": "17:34:43", "throughput": 3347.48, "total_tokens": 6686784} +{"current_steps": 5500, "total_steps": 179580, "loss": 0.1603, "lr": 1.531072502505847e-05, "epoch": 0.6125403719790623, "percentage": 3.06, "elapsed_time": "0:33:19", "remaining_time": "17:34:42", "throughput": 3347.49, "total_tokens": 6692960} +{"current_steps": 5505, "total_steps": 179580, "loss": 0.2884, "lr": 1.5324646397148902e-05, "epoch": 0.6130972268626795, "percentage": 3.07, "elapsed_time": "0:33:21", "remaining_time": "17:34:38", "throughput": 3347.46, "total_tokens": 6698784} +{"current_steps": 5510, "total_steps": 179580, "loss": 0.18, "lr": 1.5338567769239336e-05, "epoch": 0.6136540817462969, "percentage": 3.07, "elapsed_time": "0:33:23", "remaining_time": "17:34:39", "throughput": 3347.53, "total_tokens": 6705216} +{"current_steps": 5515, "total_steps": 179580, "loss": 0.1954, "lr": 1.535248914132977e-05, "epoch": 0.6142109366299142, "percentage": 3.07, "elapsed_time": "0:33:24", "remaining_time": "17:34:38", "throughput": 3347.5, "total_tokens": 6711360} +{"current_steps": 5520, "total_steps": 179580, "loss": 0.1894, "lr": 1.5366410513420205e-05, "epoch": 0.6147677915135316, "percentage": 3.07, "elapsed_time": "0:33:26", "remaining_time": "17:34:38", "throughput": 3347.53, "total_tokens": 6717728} +{"current_steps": 5525, "total_steps": 179580, "loss": 0.2553, "lr": 1.538033188551064e-05, "epoch": 0.6153246463971489, "percentage": 3.08, "elapsed_time": "0:33:28", "remaining_time": "17:34:38", "throughput": 3347.54, "total_tokens": 6724000} +{"current_steps": 5530, "total_steps": 179580, "loss": 0.2482, "lr": 1.539425325760107e-05, "epoch": 0.6158815012807662, "percentage": 3.08, "elapsed_time": "0:33:30", "remaining_time": "17:34:37", "throughput": 3347.59, "total_tokens": 6730304} +{"current_steps": 5535, "total_steps": 179580, "loss": 0.2096, "lr": 1.54081746296915e-05, "epoch": 0.6164383561643836, "percentage": 3.08, "elapsed_time": "0:33:32", "remaining_time": "17:34:34", "throughput": 3347.58, "total_tokens": 6736192} +{"current_steps": 5540, "total_steps": 179580, "loss": 0.4417, "lr": 1.5422096001781935e-05, "epoch": 0.6169952110480009, "percentage": 3.08, "elapsed_time": "0:33:33", "remaining_time": "17:34:29", "throughput": 3347.56, "total_tokens": 6741952} +{"current_steps": 5545, "total_steps": 179580, "loss": 0.2122, "lr": 1.543601737387237e-05, "epoch": 0.6175520659316183, "percentage": 3.09, "elapsed_time": "0:33:35", "remaining_time": "17:34:29", "throughput": 3347.58, "total_tokens": 6748256} +{"current_steps": 5550, "total_steps": 179580, "loss": 0.1944, "lr": 1.5449938745962804e-05, "epoch": 0.6181089208152355, "percentage": 3.09, "elapsed_time": "0:33:37", "remaining_time": "17:34:27", "throughput": 3347.59, "total_tokens": 6754336} +{"current_steps": 5555, "total_steps": 179580, "loss": 0.2377, "lr": 1.5463860118053235e-05, "epoch": 0.6186657756988528, "percentage": 3.09, "elapsed_time": "0:33:39", "remaining_time": "17:34:26", "throughput": 3347.6, "total_tokens": 6760512} +{"current_steps": 5560, "total_steps": 179580, "loss": 0.2082, "lr": 1.547778149014367e-05, "epoch": 0.6192226305824702, "percentage": 3.1, "elapsed_time": "0:33:41", "remaining_time": "17:34:25", "throughput": 3347.59, "total_tokens": 6766656} +{"current_steps": 5565, "total_steps": 179580, "loss": 0.2356, "lr": 1.5491702862234104e-05, "epoch": 0.6197794854660875, "percentage": 3.1, "elapsed_time": "0:33:43", "remaining_time": "17:34:26", "throughput": 3347.63, "total_tokens": 6773120} +{"current_steps": 5570, "total_steps": 179580, "loss": 0.1889, "lr": 1.5505624234324538e-05, "epoch": 0.6203363403497049, "percentage": 3.1, "elapsed_time": "0:33:45", "remaining_time": "17:34:26", "throughput": 3347.64, "total_tokens": 6779392} +{"current_steps": 5575, "total_steps": 179580, "loss": 0.2516, "lr": 1.551954560641497e-05, "epoch": 0.6208931952333222, "percentage": 3.1, "elapsed_time": "0:33:46", "remaining_time": "17:34:25", "throughput": 3347.66, "total_tokens": 6785600} +{"current_steps": 5580, "total_steps": 179580, "loss": 0.0842, "lr": 1.55334669785054e-05, "epoch": 0.6214500501169395, "percentage": 3.11, "elapsed_time": "0:33:48", "remaining_time": "17:34:22", "throughput": 3347.67, "total_tokens": 6791680} +{"current_steps": 5585, "total_steps": 179580, "loss": 0.3593, "lr": 1.5547388350595834e-05, "epoch": 0.6220069050005569, "percentage": 3.11, "elapsed_time": "0:33:50", "remaining_time": "17:34:19", "throughput": 3347.69, "total_tokens": 6797664} +{"current_steps": 5590, "total_steps": 179580, "loss": 0.2304, "lr": 1.556130972268627e-05, "epoch": 0.6225637598841742, "percentage": 3.11, "elapsed_time": "0:33:52", "remaining_time": "17:34:19", "throughput": 3347.71, "total_tokens": 6803968} +{"current_steps": 5595, "total_steps": 179580, "loss": 0.1724, "lr": 1.5575231094776703e-05, "epoch": 0.6231206147677915, "percentage": 3.12, "elapsed_time": "0:33:54", "remaining_time": "17:34:18", "throughput": 3347.72, "total_tokens": 6810144} +{"current_steps": 5600, "total_steps": 179580, "loss": 0.3818, "lr": 1.5589152466867134e-05, "epoch": 0.6236774696514088, "percentage": 3.12, "elapsed_time": "0:33:56", "remaining_time": "17:34:18", "throughput": 3347.74, "total_tokens": 6816448} +{"current_steps": 5605, "total_steps": 179580, "loss": 0.2663, "lr": 1.5603073838957568e-05, "epoch": 0.6242343245350261, "percentage": 3.12, "elapsed_time": "0:33:57", "remaining_time": "17:34:15", "throughput": 3347.75, "total_tokens": 6822432} +{"current_steps": 5610, "total_steps": 179580, "loss": 0.2441, "lr": 1.5616995211048002e-05, "epoch": 0.6247911794186435, "percentage": 3.12, "elapsed_time": "0:33:59", "remaining_time": "17:34:06", "throughput": 3347.72, "total_tokens": 6827744} +{"current_steps": 5615, "total_steps": 179580, "loss": 0.0956, "lr": 1.5630916583138437e-05, "epoch": 0.6253480343022608, "percentage": 3.13, "elapsed_time": "0:34:01", "remaining_time": "17:34:07", "throughput": 3347.73, "total_tokens": 6834080} +{"current_steps": 5620, "total_steps": 179580, "loss": 0.1747, "lr": 1.5644837955228868e-05, "epoch": 0.6259048891858782, "percentage": 3.13, "elapsed_time": "0:34:03", "remaining_time": "17:34:03", "throughput": 3347.69, "total_tokens": 6839872} +{"current_steps": 5625, "total_steps": 179580, "loss": 0.2856, "lr": 1.56587593273193e-05, "epoch": 0.6264617440694955, "percentage": 3.13, "elapsed_time": "0:34:04", "remaining_time": "17:34:00", "throughput": 3347.7, "total_tokens": 6845888} +{"current_steps": 5630, "total_steps": 179580, "loss": 0.0992, "lr": 1.5672680699409733e-05, "epoch": 0.6270185989531128, "percentage": 3.14, "elapsed_time": "0:34:06", "remaining_time": "17:33:56", "throughput": 3347.67, "total_tokens": 6851648} +{"current_steps": 5635, "total_steps": 179580, "loss": 0.1186, "lr": 1.5686602071500167e-05, "epoch": 0.6275754538367302, "percentage": 3.14, "elapsed_time": "0:34:08", "remaining_time": "17:33:56", "throughput": 3347.67, "total_tokens": 6857920} +{"current_steps": 5640, "total_steps": 179580, "loss": 0.315, "lr": 1.57005234435906e-05, "epoch": 0.6281323087203475, "percentage": 3.14, "elapsed_time": "0:34:10", "remaining_time": "17:33:52", "throughput": 3347.69, "total_tokens": 6863840} +{"current_steps": 5645, "total_steps": 179580, "loss": 0.1182, "lr": 1.5714444815681033e-05, "epoch": 0.6286891636039648, "percentage": 3.14, "elapsed_time": "0:34:12", "remaining_time": "17:33:52", "throughput": 3347.73, "total_tokens": 6870176} +{"current_steps": 5650, "total_steps": 179580, "loss": 0.1392, "lr": 1.5728366187771467e-05, "epoch": 0.6292460184875821, "percentage": 3.15, "elapsed_time": "0:34:13", "remaining_time": "17:33:50", "throughput": 3347.72, "total_tokens": 6876192} +{"current_steps": 5655, "total_steps": 179580, "loss": 0.1955, "lr": 1.57422875598619e-05, "epoch": 0.6298028733711994, "percentage": 3.15, "elapsed_time": "0:34:15", "remaining_time": "17:33:49", "throughput": 3347.69, "total_tokens": 6882336} +{"current_steps": 5660, "total_steps": 179580, "loss": 0.1509, "lr": 1.5756208931952336e-05, "epoch": 0.6303597282548168, "percentage": 3.15, "elapsed_time": "0:34:17", "remaining_time": "17:33:49", "throughput": 3347.69, "total_tokens": 6888608} +{"current_steps": 5665, "total_steps": 179580, "loss": 0.1942, "lr": 1.577013030404277e-05, "epoch": 0.6309165831384341, "percentage": 3.15, "elapsed_time": "0:34:19", "remaining_time": "17:33:49", "throughput": 3347.72, "total_tokens": 6894944} +{"current_steps": 5670, "total_steps": 179580, "loss": 0.1793, "lr": 1.5784051676133197e-05, "epoch": 0.6314734380220515, "percentage": 3.16, "elapsed_time": "0:34:21", "remaining_time": "17:33:47", "throughput": 3347.7, "total_tokens": 6900960} +{"current_steps": 5675, "total_steps": 179580, "loss": 0.1219, "lr": 1.5797973048223632e-05, "epoch": 0.6320302929056688, "percentage": 3.16, "elapsed_time": "0:34:23", "remaining_time": "17:33:44", "throughput": 3347.68, "total_tokens": 6906880} +{"current_steps": 5680, "total_steps": 179580, "loss": 0.2421, "lr": 1.5811894420314066e-05, "epoch": 0.6325871477892862, "percentage": 3.16, "elapsed_time": "0:34:25", "remaining_time": "17:33:45", "throughput": 3347.67, "total_tokens": 6913280} +{"current_steps": 5685, "total_steps": 179580, "loss": 0.1399, "lr": 1.58258157924045e-05, "epoch": 0.6331440026729035, "percentage": 3.17, "elapsed_time": "0:34:26", "remaining_time": "17:33:44", "throughput": 3347.68, "total_tokens": 6919520} +{"current_steps": 5690, "total_steps": 179580, "loss": 0.2319, "lr": 1.5839737164494935e-05, "epoch": 0.6337008575565207, "percentage": 3.17, "elapsed_time": "0:34:28", "remaining_time": "17:33:44", "throughput": 3347.67, "total_tokens": 6925728} +{"current_steps": 5695, "total_steps": 179580, "loss": 0.1231, "lr": 1.5853658536585366e-05, "epoch": 0.6342577124401381, "percentage": 3.17, "elapsed_time": "0:34:30", "remaining_time": "17:33:42", "throughput": 3347.68, "total_tokens": 6931808} +{"current_steps": 5700, "total_steps": 179580, "loss": 0.1776, "lr": 1.58675799086758e-05, "epoch": 0.6348145673237554, "percentage": 3.17, "elapsed_time": "0:34:32", "remaining_time": "17:33:41", "throughput": 3347.68, "total_tokens": 6938048} +{"current_steps": 5705, "total_steps": 179580, "loss": 0.2214, "lr": 1.5881501280766234e-05, "epoch": 0.6353714222073727, "percentage": 3.18, "elapsed_time": "0:34:34", "remaining_time": "17:33:36", "throughput": 3347.65, "total_tokens": 6943712} +{"current_steps": 5710, "total_steps": 179580, "loss": 0.1354, "lr": 1.589542265285667e-05, "epoch": 0.6359282770909901, "percentage": 3.18, "elapsed_time": "0:34:36", "remaining_time": "17:33:36", "throughput": 3347.62, "total_tokens": 6949888} +{"current_steps": 5715, "total_steps": 179580, "loss": 0.2091, "lr": 1.59093440249471e-05, "epoch": 0.6364851319746074, "percentage": 3.18, "elapsed_time": "0:34:37", "remaining_time": "17:33:36", "throughput": 3347.65, "total_tokens": 6956192} +{"current_steps": 5720, "total_steps": 179580, "loss": 0.244, "lr": 1.592326539703753e-05, "epoch": 0.6370419868582248, "percentage": 3.19, "elapsed_time": "0:34:39", "remaining_time": "17:33:36", "throughput": 3347.69, "total_tokens": 6962624} +{"current_steps": 5725, "total_steps": 179580, "loss": 0.2377, "lr": 1.5937186769127965e-05, "epoch": 0.6375988417418421, "percentage": 3.19, "elapsed_time": "0:34:41", "remaining_time": "17:33:28", "throughput": 3347.64, "total_tokens": 6967904} +{"current_steps": 5730, "total_steps": 179580, "loss": 0.1178, "lr": 1.59511081412184e-05, "epoch": 0.6381556966254595, "percentage": 3.19, "elapsed_time": "0:34:43", "remaining_time": "17:33:27", "throughput": 3347.65, "total_tokens": 6974080} +{"current_steps": 5735, "total_steps": 179580, "loss": 0.1976, "lr": 1.5965029513308834e-05, "epoch": 0.6387125515090767, "percentage": 3.19, "elapsed_time": "0:34:45", "remaining_time": "17:33:27", "throughput": 3347.65, "total_tokens": 6980416} +{"current_steps": 5740, "total_steps": 179580, "loss": 0.1656, "lr": 1.5978950885399264e-05, "epoch": 0.639269406392694, "percentage": 3.2, "elapsed_time": "0:34:46", "remaining_time": "17:33:25", "throughput": 3347.69, "total_tokens": 6986560} +{"current_steps": 5745, "total_steps": 179580, "loss": 0.1058, "lr": 1.59928722574897e-05, "epoch": 0.6398262612763114, "percentage": 3.2, "elapsed_time": "0:34:48", "remaining_time": "17:33:23", "throughput": 3347.73, "total_tokens": 6992704} +{"current_steps": 5750, "total_steps": 179580, "loss": 0.1538, "lr": 1.6006793629580133e-05, "epoch": 0.6403831161599287, "percentage": 3.2, "elapsed_time": "0:34:50", "remaining_time": "17:33:25", "throughput": 3347.79, "total_tokens": 6999296} +{"current_steps": 5755, "total_steps": 179580, "loss": 0.5618, "lr": 1.6020715001670567e-05, "epoch": 0.640939971043546, "percentage": 3.2, "elapsed_time": "0:34:52", "remaining_time": "17:33:24", "throughput": 3347.75, "total_tokens": 7005440} +{"current_steps": 5760, "total_steps": 179580, "loss": 0.1539, "lr": 1.6034636373761e-05, "epoch": 0.6414968259271634, "percentage": 3.21, "elapsed_time": "0:34:54", "remaining_time": "17:33:23", "throughput": 3347.77, "total_tokens": 7011616} +{"current_steps": 5765, "total_steps": 179580, "loss": 0.3539, "lr": 1.604855774585143e-05, "epoch": 0.6420536808107807, "percentage": 3.21, "elapsed_time": "0:34:56", "remaining_time": "17:33:17", "throughput": 3347.76, "total_tokens": 7017184} +{"current_steps": 5770, "total_steps": 179580, "loss": 0.3693, "lr": 1.6062479117941864e-05, "epoch": 0.6426105356943981, "percentage": 3.21, "elapsed_time": "0:34:57", "remaining_time": "17:33:14", "throughput": 3347.74, "total_tokens": 7023104} +{"current_steps": 5775, "total_steps": 179580, "loss": 0.1275, "lr": 1.6076400490032298e-05, "epoch": 0.6431673905780154, "percentage": 3.22, "elapsed_time": "0:34:59", "remaining_time": "17:33:12", "throughput": 3347.74, "total_tokens": 7029248} +{"current_steps": 5780, "total_steps": 179580, "loss": 0.1337, "lr": 1.6090321862122732e-05, "epoch": 0.6437242454616326, "percentage": 3.22, "elapsed_time": "0:35:01", "remaining_time": "17:33:11", "throughput": 3347.71, "total_tokens": 7035296} +{"current_steps": 5785, "total_steps": 179580, "loss": 0.2312, "lr": 1.6104243234213163e-05, "epoch": 0.64428110034525, "percentage": 3.22, "elapsed_time": "0:35:03", "remaining_time": "17:33:10", "throughput": 3347.72, "total_tokens": 7041536} +{"current_steps": 5790, "total_steps": 179580, "loss": 0.2187, "lr": 1.6118164606303598e-05, "epoch": 0.6448379552288673, "percentage": 3.22, "elapsed_time": "0:35:05", "remaining_time": "17:33:08", "throughput": 3347.72, "total_tokens": 7047584} +{"current_steps": 5795, "total_steps": 179580, "loss": 0.0901, "lr": 1.6132085978394032e-05, "epoch": 0.6453948101124847, "percentage": 3.23, "elapsed_time": "0:35:07", "remaining_time": "17:33:08", "throughput": 3347.75, "total_tokens": 7053920} +{"current_steps": 5800, "total_steps": 179580, "loss": 0.1631, "lr": 1.6146007350484466e-05, "epoch": 0.645951664996102, "percentage": 3.23, "elapsed_time": "0:35:08", "remaining_time": "17:33:06", "throughput": 3347.77, "total_tokens": 7060032} +{"current_steps": 5805, "total_steps": 179580, "loss": 0.1023, "lr": 1.61599287225749e-05, "epoch": 0.6465085198797194, "percentage": 3.23, "elapsed_time": "0:35:10", "remaining_time": "17:33:07", "throughput": 3347.78, "total_tokens": 7066464} +{"current_steps": 5810, "total_steps": 179580, "loss": 0.1825, "lr": 1.617385009466533e-05, "epoch": 0.6470653747633367, "percentage": 3.24, "elapsed_time": "0:35:12", "remaining_time": "17:33:05", "throughput": 3347.76, "total_tokens": 7072480} +{"current_steps": 5815, "total_steps": 179580, "loss": 0.2745, "lr": 1.6187771466755762e-05, "epoch": 0.647622229646954, "percentage": 3.24, "elapsed_time": "0:35:14", "remaining_time": "17:33:02", "throughput": 3347.76, "total_tokens": 7078432} +{"current_steps": 5820, "total_steps": 179580, "loss": 0.2596, "lr": 1.6201692838846197e-05, "epoch": 0.6481790845305714, "percentage": 3.24, "elapsed_time": "0:35:16", "remaining_time": "17:33:03", "throughput": 3347.82, "total_tokens": 7084928} +{"current_steps": 5825, "total_steps": 179580, "loss": 0.318, "lr": 1.621561421093663e-05, "epoch": 0.6487359394141886, "percentage": 3.24, "elapsed_time": "0:35:18", "remaining_time": "17:32:59", "throughput": 3347.81, "total_tokens": 7090848} +{"current_steps": 5830, "total_steps": 179580, "loss": 0.203, "lr": 1.6229535583027065e-05, "epoch": 0.649292794297806, "percentage": 3.25, "elapsed_time": "0:35:19", "remaining_time": "17:32:58", "throughput": 3347.79, "total_tokens": 7096928} +{"current_steps": 5835, "total_steps": 179580, "loss": 0.0226, "lr": 1.6243456955117496e-05, "epoch": 0.6498496491814233, "percentage": 3.25, "elapsed_time": "0:35:21", "remaining_time": "17:32:56", "throughput": 3347.8, "total_tokens": 7102976} +{"current_steps": 5840, "total_steps": 179580, "loss": 0.3038, "lr": 1.625737832720793e-05, "epoch": 0.6504065040650406, "percentage": 3.25, "elapsed_time": "0:35:23", "remaining_time": "17:32:57", "throughput": 3347.8, "total_tokens": 7109408} +{"current_steps": 5845, "total_steps": 179580, "loss": 0.2686, "lr": 1.6271299699298365e-05, "epoch": 0.650963358948658, "percentage": 3.25, "elapsed_time": "0:35:25", "remaining_time": "17:32:54", "throughput": 3347.76, "total_tokens": 7115328} +{"current_steps": 5850, "total_steps": 179580, "loss": 0.2144, "lr": 1.62852210713888e-05, "epoch": 0.6515202138322753, "percentage": 3.26, "elapsed_time": "0:35:27", "remaining_time": "17:32:53", "throughput": 3347.78, "total_tokens": 7121536} +{"current_steps": 5855, "total_steps": 179580, "loss": 0.1984, "lr": 1.629914244347923e-05, "epoch": 0.6520770687158927, "percentage": 3.26, "elapsed_time": "0:35:29", "remaining_time": "17:32:51", "throughput": 3347.78, "total_tokens": 7127616} +{"current_steps": 5860, "total_steps": 179580, "loss": 0.1442, "lr": 1.631306381556966e-05, "epoch": 0.65263392359951, "percentage": 3.26, "elapsed_time": "0:35:30", "remaining_time": "17:32:49", "throughput": 3347.82, "total_tokens": 7133760} +{"current_steps": 5865, "total_steps": 179580, "loss": 0.142, "lr": 1.6326985187660096e-05, "epoch": 0.6531907784831273, "percentage": 3.27, "elapsed_time": "0:35:32", "remaining_time": "17:32:49", "throughput": 3347.81, "total_tokens": 7139968} +{"current_steps": 5870, "total_steps": 179580, "loss": 0.1528, "lr": 1.634090655975053e-05, "epoch": 0.6537476333667446, "percentage": 3.27, "elapsed_time": "0:35:34", "remaining_time": "17:32:48", "throughput": 3347.79, "total_tokens": 7146144} +{"current_steps": 5875, "total_steps": 179580, "loss": 0.1006, "lr": 1.6354827931840964e-05, "epoch": 0.6543044882503619, "percentage": 3.27, "elapsed_time": "0:35:36", "remaining_time": "17:32:47", "throughput": 3347.82, "total_tokens": 7152384} +{"current_steps": 5880, "total_steps": 179580, "loss": 0.2766, "lr": 1.6368749303931395e-05, "epoch": 0.6548613431339793, "percentage": 3.27, "elapsed_time": "0:35:38", "remaining_time": "17:32:45", "throughput": 3347.81, "total_tokens": 7158400} +{"current_steps": 5885, "total_steps": 179580, "loss": 0.2568, "lr": 1.638267067602183e-05, "epoch": 0.6554181980175966, "percentage": 3.28, "elapsed_time": "0:35:40", "remaining_time": "17:32:43", "throughput": 3347.81, "total_tokens": 7164544} +{"current_steps": 5890, "total_steps": 179580, "loss": 0.1677, "lr": 1.6396592048112264e-05, "epoch": 0.6559750529012139, "percentage": 3.28, "elapsed_time": "0:35:41", "remaining_time": "17:32:43", "throughput": 3347.83, "total_tokens": 7170848} +{"current_steps": 5895, "total_steps": 179580, "loss": 0.2737, "lr": 1.6410513420202698e-05, "epoch": 0.6565319077848313, "percentage": 3.28, "elapsed_time": "0:35:43", "remaining_time": "17:32:41", "throughput": 3347.78, "total_tokens": 7176736} +{"current_steps": 5900, "total_steps": 179580, "loss": 0.1713, "lr": 1.642443479229313e-05, "epoch": 0.6570887626684486, "percentage": 3.29, "elapsed_time": "0:35:45", "remaining_time": "17:32:40", "throughput": 3347.82, "total_tokens": 7183040} +{"current_steps": 5905, "total_steps": 179580, "loss": 0.2272, "lr": 1.643835616438356e-05, "epoch": 0.657645617552066, "percentage": 3.29, "elapsed_time": "0:35:47", "remaining_time": "17:32:38", "throughput": 3347.87, "total_tokens": 7189248} +{"current_steps": 5910, "total_steps": 179580, "loss": 0.202, "lr": 1.6452277536473994e-05, "epoch": 0.6582024724356833, "percentage": 3.29, "elapsed_time": "0:35:49", "remaining_time": "17:32:37", "throughput": 3347.87, "total_tokens": 7195392} +{"current_steps": 5915, "total_steps": 179580, "loss": 0.1655, "lr": 1.646619890856443e-05, "epoch": 0.6587593273193005, "percentage": 3.29, "elapsed_time": "0:35:51", "remaining_time": "17:32:35", "throughput": 3347.88, "total_tokens": 7201504} +{"current_steps": 5920, "total_steps": 179580, "loss": 0.1656, "lr": 1.6480120280654863e-05, "epoch": 0.6593161822029179, "percentage": 3.3, "elapsed_time": "0:35:52", "remaining_time": "17:32:36", "throughput": 3347.87, "total_tokens": 7207904} +{"current_steps": 5925, "total_steps": 179580, "loss": 0.0671, "lr": 1.6494041652745294e-05, "epoch": 0.6598730370865352, "percentage": 3.3, "elapsed_time": "0:35:54", "remaining_time": "17:32:37", "throughput": 3347.88, "total_tokens": 7214368} +{"current_steps": 5930, "total_steps": 179580, "loss": 0.1583, "lr": 1.650796302483573e-05, "epoch": 0.6604298919701526, "percentage": 3.3, "elapsed_time": "0:35:56", "remaining_time": "17:32:36", "throughput": 3347.87, "total_tokens": 7220480} +{"current_steps": 5935, "total_steps": 179580, "loss": 0.1904, "lr": 1.6521884396926163e-05, "epoch": 0.6609867468537699, "percentage": 3.3, "elapsed_time": "0:35:58", "remaining_time": "17:32:35", "throughput": 3347.88, "total_tokens": 7226688} +{"current_steps": 5940, "total_steps": 179580, "loss": 0.1747, "lr": 1.6535805769016597e-05, "epoch": 0.6615436017373872, "percentage": 3.31, "elapsed_time": "0:36:00", "remaining_time": "17:32:36", "throughput": 3347.92, "total_tokens": 7233152} +{"current_steps": 5945, "total_steps": 179580, "loss": 0.2533, "lr": 1.6549727141107028e-05, "epoch": 0.6621004566210046, "percentage": 3.31, "elapsed_time": "0:36:02", "remaining_time": "17:32:32", "throughput": 3347.92, "total_tokens": 7239040} +{"current_steps": 5950, "total_steps": 179580, "loss": 0.1423, "lr": 1.6563648513197462e-05, "epoch": 0.6626573115046219, "percentage": 3.31, "elapsed_time": "0:36:04", "remaining_time": "17:32:31", "throughput": 3347.96, "total_tokens": 7245280} +{"current_steps": 5955, "total_steps": 179580, "loss": 0.1833, "lr": 1.6577569885287893e-05, "epoch": 0.6632141663882393, "percentage": 3.32, "elapsed_time": "0:36:05", "remaining_time": "17:32:28", "throughput": 3347.94, "total_tokens": 7251168} +{"current_steps": 5960, "total_steps": 179580, "loss": 0.3361, "lr": 1.6591491257378328e-05, "epoch": 0.6637710212718566, "percentage": 3.32, "elapsed_time": "0:36:07", "remaining_time": "17:32:21", "throughput": 3347.92, "total_tokens": 7256608} +{"current_steps": 5965, "total_steps": 179580, "loss": 0.222, "lr": 1.6605412629468762e-05, "epoch": 0.6643278761554738, "percentage": 3.32, "elapsed_time": "0:36:09", "remaining_time": "17:32:18", "throughput": 3347.94, "total_tokens": 7262624} +{"current_steps": 5970, "total_steps": 179580, "loss": 0.1265, "lr": 1.6619334001559196e-05, "epoch": 0.6648847310390912, "percentage": 3.32, "elapsed_time": "0:36:11", "remaining_time": "17:32:15", "throughput": 3347.94, "total_tokens": 7268640} +{"current_steps": 5975, "total_steps": 179580, "loss": 0.1087, "lr": 1.6633255373649627e-05, "epoch": 0.6654415859227085, "percentage": 3.33, "elapsed_time": "0:36:12", "remaining_time": "17:32:15", "throughput": 3347.97, "total_tokens": 7274976} +{"current_steps": 5980, "total_steps": 179580, "loss": 0.2288, "lr": 1.664717674574006e-05, "epoch": 0.6659984408063259, "percentage": 3.33, "elapsed_time": "0:36:14", "remaining_time": "17:32:14", "throughput": 3348.0, "total_tokens": 7281216} +{"current_steps": 5985, "total_steps": 179580, "loss": 0.2447, "lr": 1.6661098117830496e-05, "epoch": 0.6665552956899432, "percentage": 3.33, "elapsed_time": "0:36:16", "remaining_time": "17:32:14", "throughput": 3348.03, "total_tokens": 7287552} +{"current_steps": 5990, "total_steps": 179580, "loss": 0.4444, "lr": 1.6675019489920927e-05, "epoch": 0.6671121505735605, "percentage": 3.34, "elapsed_time": "0:36:18", "remaining_time": "17:32:13", "throughput": 3348.04, "total_tokens": 7293792} +{"current_steps": 5995, "total_steps": 179580, "loss": 0.1082, "lr": 1.668894086201136e-05, "epoch": 0.6676690054571779, "percentage": 3.34, "elapsed_time": "0:36:20", "remaining_time": "17:32:12", "throughput": 3348.04, "total_tokens": 7299936} +{"current_steps": 6000, "total_steps": 179580, "loss": 0.1985, "lr": 1.6702862234101792e-05, "epoch": 0.6682258603407952, "percentage": 3.34, "elapsed_time": "0:36:22", "remaining_time": "17:32:12", "throughput": 3348.05, "total_tokens": 7306240} +{"current_steps": 6005, "total_steps": 179580, "loss": 0.2618, "lr": 1.6716783606192226e-05, "epoch": 0.6687827152244126, "percentage": 3.34, "elapsed_time": "0:36:24", "remaining_time": "17:32:10", "throughput": 3348.06, "total_tokens": 7312320} +{"current_steps": 6010, "total_steps": 179580, "loss": 0.1995, "lr": 1.673070497828266e-05, "epoch": 0.6693395701080298, "percentage": 3.35, "elapsed_time": "0:36:25", "remaining_time": "17:32:10", "throughput": 3348.1, "total_tokens": 7318784} +{"current_steps": 6015, "total_steps": 179580, "loss": 0.2266, "lr": 1.6744626350373095e-05, "epoch": 0.6698964249916471, "percentage": 3.35, "elapsed_time": "0:36:27", "remaining_time": "17:32:12", "throughput": 3348.13, "total_tokens": 7325312} +{"current_steps": 6020, "total_steps": 179580, "loss": 0.2731, "lr": 1.6758547722463526e-05, "epoch": 0.6704532798752645, "percentage": 3.35, "elapsed_time": "0:36:29", "remaining_time": "17:32:09", "throughput": 3348.13, "total_tokens": 7331328} +{"current_steps": 6025, "total_steps": 179580, "loss": 0.1844, "lr": 1.677246909455396e-05, "epoch": 0.6710101347588818, "percentage": 3.36, "elapsed_time": "0:36:31", "remaining_time": "17:32:05", "throughput": 3348.15, "total_tokens": 7337216} +{"current_steps": 6030, "total_steps": 179580, "loss": 0.1553, "lr": 1.6786390466644395e-05, "epoch": 0.6715669896424992, "percentage": 3.36, "elapsed_time": "0:36:33", "remaining_time": "17:32:03", "throughput": 3348.14, "total_tokens": 7343232} +{"current_steps": 6035, "total_steps": 179580, "loss": 0.1973, "lr": 1.6800311838734825e-05, "epoch": 0.6721238445261165, "percentage": 3.36, "elapsed_time": "0:36:35", "remaining_time": "17:32:03", "throughput": 3348.13, "total_tokens": 7349568} +{"current_steps": 6040, "total_steps": 179580, "loss": 0.1229, "lr": 1.681423321082526e-05, "epoch": 0.6726806994097339, "percentage": 3.36, "elapsed_time": "0:36:36", "remaining_time": "17:32:03", "throughput": 3348.13, "total_tokens": 7355776} +{"current_steps": 6045, "total_steps": 179580, "loss": 0.2731, "lr": 1.682815458291569e-05, "epoch": 0.6732375542933512, "percentage": 3.37, "elapsed_time": "0:36:38", "remaining_time": "17:32:01", "throughput": 3348.15, "total_tokens": 7361920} +{"current_steps": 6050, "total_steps": 179580, "loss": 0.4222, "lr": 1.6842075955006125e-05, "epoch": 0.6737944091769685, "percentage": 3.37, "elapsed_time": "0:36:40", "remaining_time": "17:32:01", "throughput": 3348.17, "total_tokens": 7368288} +{"current_steps": 6055, "total_steps": 179580, "loss": 0.2081, "lr": 1.685599732709656e-05, "epoch": 0.6743512640605858, "percentage": 3.37, "elapsed_time": "0:36:42", "remaining_time": "17:31:59", "throughput": 3348.12, "total_tokens": 7374240} +{"current_steps": 6060, "total_steps": 179580, "loss": 0.1422, "lr": 1.6869918699186994e-05, "epoch": 0.6749081189442031, "percentage": 3.37, "elapsed_time": "0:36:44", "remaining_time": "17:31:57", "throughput": 3348.12, "total_tokens": 7380352} +{"current_steps": 6065, "total_steps": 179580, "loss": 0.212, "lr": 1.6883840071277428e-05, "epoch": 0.6754649738278204, "percentage": 3.38, "elapsed_time": "0:36:46", "remaining_time": "17:31:57", "throughput": 3348.11, "total_tokens": 7386592} +{"current_steps": 6070, "total_steps": 179580, "loss": 0.3724, "lr": 1.689776144336786e-05, "epoch": 0.6760218287114378, "percentage": 3.38, "elapsed_time": "0:36:48", "remaining_time": "17:31:56", "throughput": 3348.1, "total_tokens": 7392704} +{"current_steps": 6075, "total_steps": 179580, "loss": 0.1156, "lr": 1.6911682815458293e-05, "epoch": 0.6765786835950551, "percentage": 3.38, "elapsed_time": "0:36:49", "remaining_time": "17:31:54", "throughput": 3348.15, "total_tokens": 7398912} +{"current_steps": 6080, "total_steps": 179580, "loss": 0.1853, "lr": 1.6925604187548724e-05, "epoch": 0.6771355384786725, "percentage": 3.39, "elapsed_time": "0:36:51", "remaining_time": "17:31:52", "throughput": 3348.18, "total_tokens": 7405056} +{"current_steps": 6085, "total_steps": 179580, "loss": 0.1621, "lr": 1.693952555963916e-05, "epoch": 0.6776923933622898, "percentage": 3.39, "elapsed_time": "0:36:53", "remaining_time": "17:31:51", "throughput": 3348.17, "total_tokens": 7411200} +{"current_steps": 6090, "total_steps": 179580, "loss": 0.235, "lr": 1.6953446931729593e-05, "epoch": 0.6782492482459072, "percentage": 3.39, "elapsed_time": "0:36:55", "remaining_time": "17:31:48", "throughput": 3348.14, "total_tokens": 7417152} +{"current_steps": 6095, "total_steps": 179580, "loss": 0.1909, "lr": 1.6967368303820024e-05, "epoch": 0.6788061031295245, "percentage": 3.39, "elapsed_time": "0:36:57", "remaining_time": "17:31:47", "throughput": 3348.15, "total_tokens": 7423360} +{"current_steps": 6100, "total_steps": 179580, "loss": 0.3314, "lr": 1.6981289675910458e-05, "epoch": 0.6793629580131417, "percentage": 3.4, "elapsed_time": "0:36:58", "remaining_time": "17:31:44", "throughput": 3348.16, "total_tokens": 7429344} +{"current_steps": 6105, "total_steps": 179580, "loss": 0.1341, "lr": 1.6995211048000893e-05, "epoch": 0.6799198128967591, "percentage": 3.4, "elapsed_time": "0:37:00", "remaining_time": "17:31:44", "throughput": 3348.17, "total_tokens": 7435616} +{"current_steps": 6110, "total_steps": 179580, "loss": 0.2578, "lr": 1.7009132420091327e-05, "epoch": 0.6804766677803764, "percentage": 3.4, "elapsed_time": "0:37:02", "remaining_time": "17:31:42", "throughput": 3348.22, "total_tokens": 7441824} +{"current_steps": 6115, "total_steps": 179580, "loss": 0.1168, "lr": 1.7023053792181758e-05, "epoch": 0.6810335226639938, "percentage": 3.41, "elapsed_time": "0:37:04", "remaining_time": "17:31:39", "throughput": 3348.26, "total_tokens": 7447808} +{"current_steps": 6120, "total_steps": 179580, "loss": 0.0923, "lr": 1.7036975164272192e-05, "epoch": 0.6815903775476111, "percentage": 3.41, "elapsed_time": "0:37:06", "remaining_time": "17:31:36", "throughput": 3348.21, "total_tokens": 7453632} +{"current_steps": 6125, "total_steps": 179580, "loss": 0.1902, "lr": 1.7050896536362626e-05, "epoch": 0.6821472324312284, "percentage": 3.41, "elapsed_time": "0:37:07", "remaining_time": "17:31:33", "throughput": 3348.2, "total_tokens": 7459648} +{"current_steps": 6130, "total_steps": 179580, "loss": 0.167, "lr": 1.7064817908453057e-05, "epoch": 0.6827040873148458, "percentage": 3.41, "elapsed_time": "0:37:09", "remaining_time": "17:31:33", "throughput": 3348.19, "total_tokens": 7465856} +{"current_steps": 6135, "total_steps": 179580, "loss": 0.3628, "lr": 1.7078739280543492e-05, "epoch": 0.6832609421984631, "percentage": 3.42, "elapsed_time": "0:37:11", "remaining_time": "17:31:29", "throughput": 3348.15, "total_tokens": 7471680} +{"current_steps": 6140, "total_steps": 179580, "loss": 0.1338, "lr": 1.7092660652633923e-05, "epoch": 0.6838177970820805, "percentage": 3.42, "elapsed_time": "0:37:13", "remaining_time": "17:31:27", "throughput": 3348.18, "total_tokens": 7477696} +{"current_steps": 6145, "total_steps": 179580, "loss": 0.1121, "lr": 1.7106582024724357e-05, "epoch": 0.6843746519656977, "percentage": 3.42, "elapsed_time": "0:37:15", "remaining_time": "17:31:24", "throughput": 3348.19, "total_tokens": 7483776} +{"current_steps": 6150, "total_steps": 179580, "loss": 0.3635, "lr": 1.712050339681479e-05, "epoch": 0.684931506849315, "percentage": 3.42, "elapsed_time": "0:37:17", "remaining_time": "17:31:23", "throughput": 3348.17, "total_tokens": 7489856} +{"current_steps": 6155, "total_steps": 179580, "loss": 0.2577, "lr": 1.7134424768905226e-05, "epoch": 0.6854883617329324, "percentage": 3.43, "elapsed_time": "0:37:18", "remaining_time": "17:31:21", "throughput": 3348.19, "total_tokens": 7495968} +{"current_steps": 6160, "total_steps": 179580, "loss": 0.1995, "lr": 1.7148346140995657e-05, "epoch": 0.6860452166165497, "percentage": 3.43, "elapsed_time": "0:37:20", "remaining_time": "17:31:15", "throughput": 3348.18, "total_tokens": 7501536} +{"current_steps": 6165, "total_steps": 179580, "loss": 0.1576, "lr": 1.716226751308609e-05, "epoch": 0.686602071500167, "percentage": 3.43, "elapsed_time": "0:37:22", "remaining_time": "17:31:14", "throughput": 3348.19, "total_tokens": 7507808} +{"current_steps": 6170, "total_steps": 179580, "loss": 0.1215, "lr": 1.7176188885176525e-05, "epoch": 0.6871589263837844, "percentage": 3.44, "elapsed_time": "0:37:24", "remaining_time": "17:31:13", "throughput": 3348.18, "total_tokens": 7513920} +{"current_steps": 6175, "total_steps": 179580, "loss": 0.4492, "lr": 1.7190110257266956e-05, "epoch": 0.6877157812674017, "percentage": 3.44, "elapsed_time": "0:37:25", "remaining_time": "17:31:06", "throughput": 3348.17, "total_tokens": 7519424} +{"current_steps": 6180, "total_steps": 179580, "loss": 0.1512, "lr": 1.720403162935739e-05, "epoch": 0.6882726361510191, "percentage": 3.44, "elapsed_time": "0:37:27", "remaining_time": "17:31:04", "throughput": 3348.19, "total_tokens": 7525504} +{"current_steps": 6185, "total_steps": 179580, "loss": 0.2054, "lr": 1.721795300144782e-05, "epoch": 0.6888294910346364, "percentage": 3.44, "elapsed_time": "0:37:29", "remaining_time": "17:31:03", "throughput": 3348.17, "total_tokens": 7531680} +{"current_steps": 6190, "total_steps": 179580, "loss": 0.1134, "lr": 1.7231874373538256e-05, "epoch": 0.6893863459182537, "percentage": 3.45, "elapsed_time": "0:37:31", "remaining_time": "17:31:03", "throughput": 3348.18, "total_tokens": 7537952} +{"current_steps": 6195, "total_steps": 179580, "loss": 0.1219, "lr": 1.724579574562869e-05, "epoch": 0.689943200801871, "percentage": 3.45, "elapsed_time": "0:37:33", "remaining_time": "17:31:01", "throughput": 3348.19, "total_tokens": 7544000} +{"current_steps": 6200, "total_steps": 179580, "loss": 0.2172, "lr": 1.7259717117719124e-05, "epoch": 0.6905000556854883, "percentage": 3.45, "elapsed_time": "0:37:35", "remaining_time": "17:31:00", "throughput": 3348.19, "total_tokens": 7550240} +{"current_steps": 6205, "total_steps": 179580, "loss": 0.2832, "lr": 1.727363848980956e-05, "epoch": 0.6910569105691057, "percentage": 3.46, "elapsed_time": "0:37:36", "remaining_time": "17:31:02", "throughput": 3348.23, "total_tokens": 7556896} +{"current_steps": 6210, "total_steps": 179580, "loss": 0.1866, "lr": 1.728755986189999e-05, "epoch": 0.691613765452723, "percentage": 3.46, "elapsed_time": "0:37:38", "remaining_time": "17:31:01", "throughput": 3348.23, "total_tokens": 7563040} +{"current_steps": 6215, "total_steps": 179580, "loss": 0.0839, "lr": 1.7301481233990424e-05, "epoch": 0.6921706203363404, "percentage": 3.46, "elapsed_time": "0:37:40", "remaining_time": "17:30:59", "throughput": 3348.22, "total_tokens": 7569088} +{"current_steps": 6220, "total_steps": 179580, "loss": 0.1153, "lr": 1.7315402606080855e-05, "epoch": 0.6927274752199577, "percentage": 3.46, "elapsed_time": "0:37:42", "remaining_time": "17:30:58", "throughput": 3348.27, "total_tokens": 7575392} +{"current_steps": 6225, "total_steps": 179580, "loss": 0.1084, "lr": 1.732932397817129e-05, "epoch": 0.693284330103575, "percentage": 3.47, "elapsed_time": "0:37:44", "remaining_time": "17:30:54", "throughput": 3348.25, "total_tokens": 7581184} +{"current_steps": 6230, "total_steps": 179580, "loss": 0.2464, "lr": 1.7343245350261724e-05, "epoch": 0.6938411849871924, "percentage": 3.47, "elapsed_time": "0:37:45", "remaining_time": "17:30:51", "throughput": 3348.26, "total_tokens": 7587136} +{"current_steps": 6235, "total_steps": 179580, "loss": 0.1825, "lr": 1.7357166722352155e-05, "epoch": 0.6943980398708096, "percentage": 3.47, "elapsed_time": "0:37:47", "remaining_time": "17:30:49", "throughput": 3348.26, "total_tokens": 7593184} +{"current_steps": 6240, "total_steps": 179580, "loss": 0.1725, "lr": 1.737108809444259e-05, "epoch": 0.694954894754427, "percentage": 3.47, "elapsed_time": "0:37:49", "remaining_time": "17:30:48", "throughput": 3348.29, "total_tokens": 7599456} +{"current_steps": 6245, "total_steps": 179580, "loss": 0.2601, "lr": 1.7385009466533023e-05, "epoch": 0.6955117496380443, "percentage": 3.48, "elapsed_time": "0:37:51", "remaining_time": "17:30:40", "throughput": 3348.24, "total_tokens": 7604736} +{"current_steps": 6250, "total_steps": 179580, "loss": 0.1817, "lr": 1.7398930838623458e-05, "epoch": 0.6960686045216616, "percentage": 3.48, "elapsed_time": "0:37:53", "remaining_time": "17:30:41", "throughput": 3348.25, "total_tokens": 7611104} +{"current_steps": 6255, "total_steps": 179580, "loss": 0.1258, "lr": 1.741285221071389e-05, "epoch": 0.696625459405279, "percentage": 3.48, "elapsed_time": "0:37:55", "remaining_time": "17:30:42", "throughput": 3348.29, "total_tokens": 7617664} +{"current_steps": 6260, "total_steps": 179580, "loss": 0.2446, "lr": 1.7426773582804323e-05, "epoch": 0.6971823142888963, "percentage": 3.49, "elapsed_time": "0:37:56", "remaining_time": "17:30:43", "throughput": 3348.34, "total_tokens": 7624160} +{"current_steps": 6265, "total_steps": 179580, "loss": 0.2722, "lr": 1.7440694954894754e-05, "epoch": 0.6977391691725137, "percentage": 3.49, "elapsed_time": "0:37:58", "remaining_time": "17:30:41", "throughput": 3348.32, "total_tokens": 7630240} +{"current_steps": 6270, "total_steps": 179580, "loss": 0.2891, "lr": 1.7454616326985188e-05, "epoch": 0.698296024056131, "percentage": 3.49, "elapsed_time": "0:38:00", "remaining_time": "17:30:40", "throughput": 3348.34, "total_tokens": 7636544} +{"current_steps": 6275, "total_steps": 179580, "loss": 0.174, "lr": 1.7468537699075622e-05, "epoch": 0.6988528789397483, "percentage": 3.49, "elapsed_time": "0:38:02", "remaining_time": "17:30:42", "throughput": 3348.36, "total_tokens": 7643040} +{"current_steps": 6280, "total_steps": 179580, "loss": 0.2243, "lr": 1.7482459071166053e-05, "epoch": 0.6994097338233656, "percentage": 3.5, "elapsed_time": "0:38:04", "remaining_time": "17:30:41", "throughput": 3348.39, "total_tokens": 7649344} +{"current_steps": 6285, "total_steps": 179580, "loss": 0.2318, "lr": 1.7496380443256488e-05, "epoch": 0.6999665887069829, "percentage": 3.5, "elapsed_time": "0:38:06", "remaining_time": "17:30:41", "throughput": 3348.39, "total_tokens": 7655584} +{"current_steps": 6290, "total_steps": 179580, "loss": 0.2505, "lr": 1.7510301815346922e-05, "epoch": 0.7005234435906003, "percentage": 3.5, "elapsed_time": "0:38:08", "remaining_time": "17:30:40", "throughput": 3348.42, "total_tokens": 7661920} +{"current_steps": 6295, "total_steps": 179580, "loss": 0.3568, "lr": 1.7524223187437356e-05, "epoch": 0.7010802984742176, "percentage": 3.51, "elapsed_time": "0:38:10", "remaining_time": "17:30:39", "throughput": 3348.4, "total_tokens": 7668000} +{"current_steps": 6300, "total_steps": 179580, "loss": 0.1609, "lr": 1.7538144559527787e-05, "epoch": 0.7016371533578349, "percentage": 3.51, "elapsed_time": "0:38:11", "remaining_time": "17:30:35", "throughput": 3348.35, "total_tokens": 7673792} +{"current_steps": 6305, "total_steps": 179580, "loss": 0.2697, "lr": 1.755206593161822e-05, "epoch": 0.7021940082414523, "percentage": 3.51, "elapsed_time": "0:38:13", "remaining_time": "17:30:32", "throughput": 3348.35, "total_tokens": 7679744} +{"current_steps": 6310, "total_steps": 179580, "loss": 0.2468, "lr": 1.7565987303708653e-05, "epoch": 0.7027508631250696, "percentage": 3.51, "elapsed_time": "0:38:15", "remaining_time": "17:30:30", "throughput": 3348.35, "total_tokens": 7685792} +{"current_steps": 6315, "total_steps": 179580, "loss": 0.2369, "lr": 1.7579908675799087e-05, "epoch": 0.703307718008687, "percentage": 3.52, "elapsed_time": "0:38:17", "remaining_time": "17:30:30", "throughput": 3348.35, "total_tokens": 7692032} +{"current_steps": 6320, "total_steps": 179580, "loss": 0.1116, "lr": 1.759383004788952e-05, "epoch": 0.7038645728923043, "percentage": 3.52, "elapsed_time": "0:38:18", "remaining_time": "17:30:25", "throughput": 3348.37, "total_tokens": 7697792} +{"current_steps": 6325, "total_steps": 179580, "loss": 0.1153, "lr": 1.7607751419979952e-05, "epoch": 0.7044214277759216, "percentage": 3.52, "elapsed_time": "0:38:20", "remaining_time": "17:30:24", "throughput": 3348.4, "total_tokens": 7704160} +{"current_steps": 6330, "total_steps": 179580, "loss": 0.2803, "lr": 1.7621672792070387e-05, "epoch": 0.7049782826595389, "percentage": 3.52, "elapsed_time": "0:38:22", "remaining_time": "17:30:23", "throughput": 3348.41, "total_tokens": 7710304} +{"current_steps": 6335, "total_steps": 179580, "loss": 0.1766, "lr": 1.763559416416082e-05, "epoch": 0.7055351375431562, "percentage": 3.53, "elapsed_time": "0:38:24", "remaining_time": "17:30:20", "throughput": 3348.43, "total_tokens": 7716320} +{"current_steps": 6340, "total_steps": 179580, "loss": 0.1344, "lr": 1.7649515536251255e-05, "epoch": 0.7060919924267736, "percentage": 3.53, "elapsed_time": "0:38:26", "remaining_time": "17:30:19", "throughput": 3348.47, "total_tokens": 7722592} +{"current_steps": 6345, "total_steps": 179580, "loss": 0.225, "lr": 1.766343690834169e-05, "epoch": 0.7066488473103909, "percentage": 3.53, "elapsed_time": "0:38:28", "remaining_time": "17:30:18", "throughput": 3348.47, "total_tokens": 7728832} +{"current_steps": 6350, "total_steps": 179580, "loss": 0.1358, "lr": 1.767735828043212e-05, "epoch": 0.7072057021940082, "percentage": 3.54, "elapsed_time": "0:38:30", "remaining_time": "17:30:18", "throughput": 3348.49, "total_tokens": 7735136} +{"current_steps": 6355, "total_steps": 179580, "loss": 0.0742, "lr": 1.769127965252255e-05, "epoch": 0.7077625570776256, "percentage": 3.54, "elapsed_time": "0:38:31", "remaining_time": "17:30:17", "throughput": 3348.54, "total_tokens": 7741472} +{"current_steps": 6360, "total_steps": 179580, "loss": 0.0774, "lr": 1.7705201024612986e-05, "epoch": 0.7083194119612429, "percentage": 3.54, "elapsed_time": "0:38:33", "remaining_time": "17:30:15", "throughput": 3348.59, "total_tokens": 7747680} +{"current_steps": 6365, "total_steps": 179580, "loss": 0.15, "lr": 1.771912239670342e-05, "epoch": 0.7088762668448603, "percentage": 3.54, "elapsed_time": "0:38:35", "remaining_time": "17:30:15", "throughput": 3348.58, "total_tokens": 7753856} +{"current_steps": 6370, "total_steps": 179580, "loss": 0.2496, "lr": 1.7733043768793854e-05, "epoch": 0.7094331217284776, "percentage": 3.55, "elapsed_time": "0:38:37", "remaining_time": "17:30:12", "throughput": 3348.6, "total_tokens": 7759872} +{"current_steps": 6375, "total_steps": 179580, "loss": 0.384, "lr": 1.7746965140884285e-05, "epoch": 0.7099899766120948, "percentage": 3.55, "elapsed_time": "0:38:39", "remaining_time": "17:30:10", "throughput": 3348.6, "total_tokens": 7765920} +{"current_steps": 6380, "total_steps": 179580, "loss": 0.2062, "lr": 1.776088651297472e-05, "epoch": 0.7105468314957122, "percentage": 3.55, "elapsed_time": "0:38:40", "remaining_time": "17:30:08", "throughput": 3348.61, "total_tokens": 7772096} +{"current_steps": 6385, "total_steps": 179580, "loss": 0.325, "lr": 1.7774807885065154e-05, "epoch": 0.7111036863793295, "percentage": 3.56, "elapsed_time": "0:38:42", "remaining_time": "17:30:06", "throughput": 3348.58, "total_tokens": 7778112} +{"current_steps": 6390, "total_steps": 179580, "loss": 0.2671, "lr": 1.7788729257155588e-05, "epoch": 0.7116605412629469, "percentage": 3.56, "elapsed_time": "0:38:44", "remaining_time": "17:30:04", "throughput": 3348.59, "total_tokens": 7784128} +{"current_steps": 6395, "total_steps": 179580, "loss": 0.2494, "lr": 1.780265062924602e-05, "epoch": 0.7122173961465642, "percentage": 3.56, "elapsed_time": "0:38:46", "remaining_time": "17:30:00", "throughput": 3348.57, "total_tokens": 7789888} +{"current_steps": 6400, "total_steps": 179580, "loss": 0.1723, "lr": 1.781657200133645e-05, "epoch": 0.7127742510301815, "percentage": 3.56, "elapsed_time": "0:38:48", "remaining_time": "17:29:58", "throughput": 3348.55, "total_tokens": 7795968} +{"current_steps": 6405, "total_steps": 179580, "loss": 0.3804, "lr": 1.7830493373426884e-05, "epoch": 0.7133311059137989, "percentage": 3.57, "elapsed_time": "0:38:49", "remaining_time": "17:29:55", "throughput": 3348.55, "total_tokens": 7801920} +{"current_steps": 6410, "total_steps": 179580, "loss": 0.2118, "lr": 1.784441474551732e-05, "epoch": 0.7138879607974162, "percentage": 3.57, "elapsed_time": "0:38:51", "remaining_time": "17:29:55", "throughput": 3348.6, "total_tokens": 7808320} +{"current_steps": 6415, "total_steps": 179580, "loss": 0.2461, "lr": 1.7858336117607753e-05, "epoch": 0.7144448156810336, "percentage": 3.57, "elapsed_time": "0:38:53", "remaining_time": "17:29:54", "throughput": 3348.63, "total_tokens": 7814656} +{"current_steps": 6420, "total_steps": 179580, "loss": 0.209, "lr": 1.7872257489698184e-05, "epoch": 0.7150016705646508, "percentage": 3.58, "elapsed_time": "0:38:55", "remaining_time": "17:29:54", "throughput": 3348.67, "total_tokens": 7821024} +{"current_steps": 6425, "total_steps": 179580, "loss": 0.0877, "lr": 1.788617886178862e-05, "epoch": 0.7155585254482681, "percentage": 3.58, "elapsed_time": "0:38:57", "remaining_time": "17:29:54", "throughput": 3348.65, "total_tokens": 7827296} +{"current_steps": 6430, "total_steps": 179580, "loss": 0.1941, "lr": 1.7900100233879053e-05, "epoch": 0.7161153803318855, "percentage": 3.58, "elapsed_time": "0:38:59", "remaining_time": "17:29:56", "throughput": 3348.68, "total_tokens": 7833856} +{"current_steps": 6435, "total_steps": 179580, "loss": 0.2169, "lr": 1.7914021605969487e-05, "epoch": 0.7166722352155028, "percentage": 3.58, "elapsed_time": "0:39:01", "remaining_time": "17:29:55", "throughput": 3348.71, "total_tokens": 7840128} +{"current_steps": 6440, "total_steps": 179580, "loss": 0.0964, "lr": 1.7927942978059918e-05, "epoch": 0.7172290900991202, "percentage": 3.59, "elapsed_time": "0:39:03", "remaining_time": "17:29:52", "throughput": 3348.73, "total_tokens": 7846208} +{"current_steps": 6445, "total_steps": 179580, "loss": 0.3389, "lr": 1.7941864350150352e-05, "epoch": 0.7177859449827375, "percentage": 3.59, "elapsed_time": "0:39:04", "remaining_time": "17:29:50", "throughput": 3348.7, "total_tokens": 7852160} +{"current_steps": 6450, "total_steps": 179580, "loss": 0.1043, "lr": 1.7955785722240783e-05, "epoch": 0.7183427998663549, "percentage": 3.59, "elapsed_time": "0:39:06", "remaining_time": "17:29:49", "throughput": 3348.74, "total_tokens": 7858464} +{"current_steps": 6455, "total_steps": 179580, "loss": 0.1962, "lr": 1.7969707094331218e-05, "epoch": 0.7188996547499722, "percentage": 3.59, "elapsed_time": "0:39:08", "remaining_time": "17:29:48", "throughput": 3348.76, "total_tokens": 7864640} +{"current_steps": 6460, "total_steps": 179580, "loss": 0.2932, "lr": 1.7983628466421652e-05, "epoch": 0.7194565096335895, "percentage": 3.6, "elapsed_time": "0:39:10", "remaining_time": "17:29:49", "throughput": 3348.81, "total_tokens": 7871232} +{"current_steps": 6465, "total_steps": 179580, "loss": 0.1306, "lr": 1.7997549838512083e-05, "epoch": 0.7200133645172068, "percentage": 3.6, "elapsed_time": "0:39:12", "remaining_time": "17:29:47", "throughput": 3348.82, "total_tokens": 7877312} +{"current_steps": 6470, "total_steps": 179580, "loss": 0.2154, "lr": 1.8011471210602517e-05, "epoch": 0.7205702194008241, "percentage": 3.6, "elapsed_time": "0:39:14", "remaining_time": "17:29:45", "throughput": 3348.85, "total_tokens": 7883488} +{"current_steps": 6475, "total_steps": 179580, "loss": 0.2824, "lr": 1.802539258269295e-05, "epoch": 0.7211270742844414, "percentage": 3.61, "elapsed_time": "0:39:15", "remaining_time": "17:29:44", "throughput": 3348.88, "total_tokens": 7889760} +{"current_steps": 6480, "total_steps": 179580, "loss": 0.1607, "lr": 1.8039313954783386e-05, "epoch": 0.7216839291680588, "percentage": 3.61, "elapsed_time": "0:39:17", "remaining_time": "17:29:42", "throughput": 3348.83, "total_tokens": 7895744} +{"current_steps": 6485, "total_steps": 179580, "loss": 0.1803, "lr": 1.805323532687382e-05, "epoch": 0.7222407840516761, "percentage": 3.61, "elapsed_time": "0:39:19", "remaining_time": "17:29:43", "throughput": 3348.85, "total_tokens": 7902144} +{"current_steps": 6490, "total_steps": 179580, "loss": 0.1298, "lr": 1.806715669896425e-05, "epoch": 0.7227976389352935, "percentage": 3.61, "elapsed_time": "0:39:21", "remaining_time": "17:29:43", "throughput": 3348.86, "total_tokens": 7908608} +{"current_steps": 6495, "total_steps": 179580, "loss": 0.0694, "lr": 1.8081078071054682e-05, "epoch": 0.7233544938189108, "percentage": 3.62, "elapsed_time": "0:39:23", "remaining_time": "17:29:42", "throughput": 3348.86, "total_tokens": 7914752} +{"current_steps": 6500, "total_steps": 179580, "loss": 0.1319, "lr": 1.8094999443145116e-05, "epoch": 0.7239113487025282, "percentage": 3.62, "elapsed_time": "0:39:25", "remaining_time": "17:29:38", "throughput": 3348.86, "total_tokens": 7920576} +{"current_steps": 6505, "total_steps": 179580, "loss": 0.2307, "lr": 1.810892081523555e-05, "epoch": 0.7244682035861455, "percentage": 3.62, "elapsed_time": "0:39:26", "remaining_time": "17:29:36", "throughput": 3348.82, "total_tokens": 7926560} +{"current_steps": 6510, "total_steps": 179580, "loss": 0.1174, "lr": 1.8122842187325985e-05, "epoch": 0.7250250584697627, "percentage": 3.63, "elapsed_time": "0:39:28", "remaining_time": "17:29:32", "throughput": 3348.83, "total_tokens": 7932416} +{"current_steps": 6515, "total_steps": 179580, "loss": 0.1885, "lr": 1.8136763559416416e-05, "epoch": 0.7255819133533801, "percentage": 3.63, "elapsed_time": "0:39:30", "remaining_time": "17:29:31", "throughput": 3348.85, "total_tokens": 7938656} +{"current_steps": 6520, "total_steps": 179580, "loss": 0.1502, "lr": 1.815068493150685e-05, "epoch": 0.7261387682369974, "percentage": 3.63, "elapsed_time": "0:39:32", "remaining_time": "17:29:30", "throughput": 3348.83, "total_tokens": 7944768} +{"current_steps": 6525, "total_steps": 179580, "loss": 0.3084, "lr": 1.8164606303597285e-05, "epoch": 0.7266956231206148, "percentage": 3.63, "elapsed_time": "0:39:34", "remaining_time": "17:29:27", "throughput": 3348.8, "total_tokens": 7950592} +{"current_steps": 6530, "total_steps": 179580, "loss": 0.1637, "lr": 1.817852767568772e-05, "epoch": 0.7272524780042321, "percentage": 3.64, "elapsed_time": "0:39:35", "remaining_time": "17:29:25", "throughput": 3348.8, "total_tokens": 7956736} +{"current_steps": 6535, "total_steps": 179580, "loss": 0.1523, "lr": 1.819244904777815e-05, "epoch": 0.7278093328878494, "percentage": 3.64, "elapsed_time": "0:39:37", "remaining_time": "17:29:25", "throughput": 3348.79, "total_tokens": 7962944} +{"current_steps": 6540, "total_steps": 179580, "loss": 0.1837, "lr": 1.820637041986858e-05, "epoch": 0.7283661877714668, "percentage": 3.64, "elapsed_time": "0:39:39", "remaining_time": "17:29:21", "throughput": 3348.81, "total_tokens": 7968864} +{"current_steps": 6545, "total_steps": 179580, "loss": 0.3234, "lr": 1.8220291791959015e-05, "epoch": 0.7289230426550841, "percentage": 3.64, "elapsed_time": "0:39:41", "remaining_time": "17:29:20", "throughput": 3348.8, "total_tokens": 7975072} +{"current_steps": 6550, "total_steps": 179580, "loss": 0.3038, "lr": 1.823421316404945e-05, "epoch": 0.7294798975387015, "percentage": 3.65, "elapsed_time": "0:39:43", "remaining_time": "17:29:21", "throughput": 3348.84, "total_tokens": 7981536} +{"current_steps": 6555, "total_steps": 179580, "loss": 0.1867, "lr": 1.8248134536139884e-05, "epoch": 0.7300367524223187, "percentage": 3.65, "elapsed_time": "0:39:45", "remaining_time": "17:29:20", "throughput": 3348.84, "total_tokens": 7987840} +{"current_steps": 6560, "total_steps": 179580, "loss": 0.1753, "lr": 1.8262055908230315e-05, "epoch": 0.730593607305936, "percentage": 3.65, "elapsed_time": "0:39:47", "remaining_time": "17:29:20", "throughput": 3348.85, "total_tokens": 7994112} +{"current_steps": 6565, "total_steps": 179580, "loss": 0.2755, "lr": 1.827597728032075e-05, "epoch": 0.7311504621895534, "percentage": 3.66, "elapsed_time": "0:39:48", "remaining_time": "17:29:19", "throughput": 3348.89, "total_tokens": 8000384} +{"current_steps": 6570, "total_steps": 179580, "loss": 0.1216, "lr": 1.8289898652411183e-05, "epoch": 0.7317073170731707, "percentage": 3.66, "elapsed_time": "0:39:50", "remaining_time": "17:29:18", "throughput": 3348.9, "total_tokens": 8006656} +{"current_steps": 6575, "total_steps": 179580, "loss": 0.0486, "lr": 1.8303820024501618e-05, "epoch": 0.7322641719567881, "percentage": 3.66, "elapsed_time": "0:39:52", "remaining_time": "17:29:17", "throughput": 3348.92, "total_tokens": 8012864} +{"current_steps": 6580, "total_steps": 179580, "loss": 0.1939, "lr": 1.831774139659205e-05, "epoch": 0.7328210268404054, "percentage": 3.66, "elapsed_time": "0:39:54", "remaining_time": "17:29:14", "throughput": 3348.92, "total_tokens": 8018880} +{"current_steps": 6585, "total_steps": 179580, "loss": 0.115, "lr": 1.833166276868248e-05, "epoch": 0.7333778817240227, "percentage": 3.67, "elapsed_time": "0:39:56", "remaining_time": "17:29:13", "throughput": 3348.92, "total_tokens": 8025024} +{"current_steps": 6590, "total_steps": 179580, "loss": 0.1191, "lr": 1.8345584140772914e-05, "epoch": 0.7339347366076401, "percentage": 3.67, "elapsed_time": "0:39:58", "remaining_time": "17:29:11", "throughput": 3348.92, "total_tokens": 8031072} +{"current_steps": 6595, "total_steps": 179580, "loss": 0.2371, "lr": 1.835950551286335e-05, "epoch": 0.7344915914912574, "percentage": 3.67, "elapsed_time": "0:39:59", "remaining_time": "17:29:09", "throughput": 3348.92, "total_tokens": 8037184} +{"current_steps": 6600, "total_steps": 179580, "loss": 0.3163, "lr": 1.8373426884953783e-05, "epoch": 0.7350484463748747, "percentage": 3.68, "elapsed_time": "0:40:01", "remaining_time": "17:29:08", "throughput": 3348.93, "total_tokens": 8043360} +{"current_steps": 6605, "total_steps": 179580, "loss": 0.111, "lr": 1.8387348257044214e-05, "epoch": 0.735605301258492, "percentage": 3.68, "elapsed_time": "0:40:03", "remaining_time": "17:29:06", "throughput": 3348.94, "total_tokens": 8049440} +{"current_steps": 6610, "total_steps": 179580, "loss": 0.3732, "lr": 1.8401269629134648e-05, "epoch": 0.7361621561421093, "percentage": 3.68, "elapsed_time": "0:40:05", "remaining_time": "17:29:03", "throughput": 3348.9, "total_tokens": 8055392} +{"current_steps": 6615, "total_steps": 179580, "loss": 0.209, "lr": 1.8415191001225082e-05, "epoch": 0.7367190110257267, "percentage": 3.68, "elapsed_time": "0:40:07", "remaining_time": "17:29:01", "throughput": 3348.9, "total_tokens": 8061376} +{"current_steps": 6620, "total_steps": 179580, "loss": 0.1918, "lr": 1.8429112373315517e-05, "epoch": 0.737275865909344, "percentage": 3.69, "elapsed_time": "0:40:09", "remaining_time": "17:29:00", "throughput": 3348.93, "total_tokens": 8067744} +{"current_steps": 6625, "total_steps": 179580, "loss": 0.1112, "lr": 1.844303374540595e-05, "epoch": 0.7378327207929614, "percentage": 3.69, "elapsed_time": "0:40:10", "remaining_time": "17:28:58", "throughput": 3348.93, "total_tokens": 8073696} +{"current_steps": 6630, "total_steps": 179580, "loss": 0.2386, "lr": 1.845695511749638e-05, "epoch": 0.7383895756765787, "percentage": 3.69, "elapsed_time": "0:40:12", "remaining_time": "17:28:52", "throughput": 3348.89, "total_tokens": 8079136} +{"current_steps": 6635, "total_steps": 179580, "loss": 0.4441, "lr": 1.8470876489586813e-05, "epoch": 0.738946430560196, "percentage": 3.69, "elapsed_time": "0:40:14", "remaining_time": "17:28:51", "throughput": 3348.88, "total_tokens": 8085344} +{"current_steps": 6640, "total_steps": 179580, "loss": 0.0804, "lr": 1.8484797861677247e-05, "epoch": 0.7395032854438134, "percentage": 3.7, "elapsed_time": "0:40:16", "remaining_time": "17:28:50", "throughput": 3348.87, "total_tokens": 8091520} +{"current_steps": 6645, "total_steps": 179580, "loss": 0.2958, "lr": 1.849871923376768e-05, "epoch": 0.7400601403274307, "percentage": 3.7, "elapsed_time": "0:40:18", "remaining_time": "17:28:48", "throughput": 3348.88, "total_tokens": 8097600} +{"current_steps": 6650, "total_steps": 179580, "loss": 0.148, "lr": 1.8512640605858116e-05, "epoch": 0.740616995211048, "percentage": 3.7, "elapsed_time": "0:40:19", "remaining_time": "17:28:48", "throughput": 3348.89, "total_tokens": 8103968} +{"current_steps": 6655, "total_steps": 179580, "loss": 0.2777, "lr": 1.8526561977948547e-05, "epoch": 0.7411738500946653, "percentage": 3.71, "elapsed_time": "0:40:21", "remaining_time": "17:28:43", "throughput": 3348.86, "total_tokens": 8109664} +{"current_steps": 6660, "total_steps": 179580, "loss": 0.2114, "lr": 1.854048335003898e-05, "epoch": 0.7417307049782826, "percentage": 3.71, "elapsed_time": "0:40:23", "remaining_time": "17:28:40", "throughput": 3348.84, "total_tokens": 8115552} +{"current_steps": 6665, "total_steps": 179580, "loss": 0.1688, "lr": 1.8554404722129415e-05, "epoch": 0.7422875598619, "percentage": 3.71, "elapsed_time": "0:40:25", "remaining_time": "17:28:38", "throughput": 3348.84, "total_tokens": 8121504} +{"current_steps": 6670, "total_steps": 179580, "loss": 0.0761, "lr": 1.856832609421985e-05, "epoch": 0.7428444147455173, "percentage": 3.71, "elapsed_time": "0:40:27", "remaining_time": "17:28:37", "throughput": 3348.85, "total_tokens": 8127776} +{"current_steps": 6675, "total_steps": 179580, "loss": 0.2317, "lr": 1.858224746631028e-05, "epoch": 0.7434012696291347, "percentage": 3.72, "elapsed_time": "0:40:28", "remaining_time": "17:28:36", "throughput": 3348.86, "total_tokens": 8133952} +{"current_steps": 6680, "total_steps": 179580, "loss": 0.2279, "lr": 1.859616883840071e-05, "epoch": 0.743958124512752, "percentage": 3.72, "elapsed_time": "0:40:30", "remaining_time": "17:28:36", "throughput": 3348.89, "total_tokens": 8140416} +{"current_steps": 6685, "total_steps": 179580, "loss": 0.1504, "lr": 1.8610090210491146e-05, "epoch": 0.7445149793963693, "percentage": 3.72, "elapsed_time": "0:40:32", "remaining_time": "17:28:36", "throughput": 3348.88, "total_tokens": 8146688} +{"current_steps": 6690, "total_steps": 179580, "loss": 0.1498, "lr": 1.862401158258158e-05, "epoch": 0.7450718342799867, "percentage": 3.73, "elapsed_time": "0:40:34", "remaining_time": "17:28:29", "throughput": 3348.87, "total_tokens": 8152160} +{"current_steps": 6695, "total_steps": 179580, "loss": 0.1434, "lr": 1.8637932954672015e-05, "epoch": 0.7456286891636039, "percentage": 3.73, "elapsed_time": "0:40:36", "remaining_time": "17:28:27", "throughput": 3348.87, "total_tokens": 8158176} +{"current_steps": 6700, "total_steps": 179580, "loss": 0.3427, "lr": 1.8651854326762445e-05, "epoch": 0.7461855440472213, "percentage": 3.73, "elapsed_time": "0:40:37", "remaining_time": "17:28:26", "throughput": 3348.9, "total_tokens": 8164512} +{"current_steps": 6705, "total_steps": 179580, "loss": 0.2609, "lr": 1.866577569885288e-05, "epoch": 0.7467423989308386, "percentage": 3.73, "elapsed_time": "0:40:39", "remaining_time": "17:28:25", "throughput": 3348.91, "total_tokens": 8170720} +{"current_steps": 6710, "total_steps": 179580, "loss": 0.2468, "lr": 1.8679697070943314e-05, "epoch": 0.7472992538144559, "percentage": 3.74, "elapsed_time": "0:40:41", "remaining_time": "17:28:22", "throughput": 3348.92, "total_tokens": 8176672} +{"current_steps": 6715, "total_steps": 179580, "loss": 0.2891, "lr": 1.869361844303375e-05, "epoch": 0.7478561086980733, "percentage": 3.74, "elapsed_time": "0:40:43", "remaining_time": "17:28:23", "throughput": 3348.94, "total_tokens": 8183168} +{"current_steps": 6720, "total_steps": 179580, "loss": 0.2447, "lr": 1.870753981512418e-05, "epoch": 0.7484129635816906, "percentage": 3.74, "elapsed_time": "0:40:45", "remaining_time": "17:28:20", "throughput": 3348.93, "total_tokens": 8189024} +{"current_steps": 6725, "total_steps": 179580, "loss": 0.3662, "lr": 1.872146118721461e-05, "epoch": 0.748969818465308, "percentage": 3.74, "elapsed_time": "0:40:47", "remaining_time": "17:28:19", "throughput": 3348.93, "total_tokens": 8195264} +{"current_steps": 6730, "total_steps": 179580, "loss": 0.1134, "lr": 1.8735382559305045e-05, "epoch": 0.7495266733489253, "percentage": 3.75, "elapsed_time": "0:40:48", "remaining_time": "17:28:18", "throughput": 3348.95, "total_tokens": 8201472} +{"current_steps": 6735, "total_steps": 179580, "loss": 0.1643, "lr": 1.874930393139548e-05, "epoch": 0.7500835282325427, "percentage": 3.75, "elapsed_time": "0:40:50", "remaining_time": "17:28:16", "throughput": 3348.94, "total_tokens": 8207520} +{"current_steps": 6740, "total_steps": 179580, "loss": 0.2786, "lr": 1.8763225303485913e-05, "epoch": 0.7506403831161599, "percentage": 3.75, "elapsed_time": "0:40:52", "remaining_time": "17:28:13", "throughput": 3348.92, "total_tokens": 8213440} +{"current_steps": 6745, "total_steps": 179580, "loss": 0.1887, "lr": 1.8777146675576344e-05, "epoch": 0.7511972379997772, "percentage": 3.76, "elapsed_time": "0:40:54", "remaining_time": "17:28:11", "throughput": 3348.91, "total_tokens": 8219520} +{"current_steps": 6750, "total_steps": 179580, "loss": 0.242, "lr": 1.879106804766678e-05, "epoch": 0.7517540928833946, "percentage": 3.76, "elapsed_time": "0:40:56", "remaining_time": "17:28:09", "throughput": 3348.92, "total_tokens": 8225600} +{"current_steps": 6755, "total_steps": 179580, "loss": 0.1691, "lr": 1.8804989419757213e-05, "epoch": 0.7523109477670119, "percentage": 3.76, "elapsed_time": "0:40:58", "remaining_time": "17:28:09", "throughput": 3348.94, "total_tokens": 8232000} +{"current_steps": 6760, "total_steps": 179580, "loss": 0.2117, "lr": 1.8818910791847647e-05, "epoch": 0.7528678026506292, "percentage": 3.76, "elapsed_time": "0:40:59", "remaining_time": "17:28:08", "throughput": 3348.95, "total_tokens": 8238208} +{"current_steps": 6765, "total_steps": 179580, "loss": 0.2135, "lr": 1.8832832163938078e-05, "epoch": 0.7534246575342466, "percentage": 3.77, "elapsed_time": "0:41:01", "remaining_time": "17:28:02", "throughput": 3348.96, "total_tokens": 8243840} +{"current_steps": 6770, "total_steps": 179580, "loss": 0.2572, "lr": 1.884675353602851e-05, "epoch": 0.7539815124178639, "percentage": 3.77, "elapsed_time": "0:41:03", "remaining_time": "17:28:02", "throughput": 3348.98, "total_tokens": 8250144} +{"current_steps": 6775, "total_steps": 179580, "loss": 0.2518, "lr": 1.8860674908118943e-05, "epoch": 0.7545383673014813, "percentage": 3.77, "elapsed_time": "0:41:05", "remaining_time": "17:28:00", "throughput": 3349.01, "total_tokens": 8256320} +{"current_steps": 6780, "total_steps": 179580, "loss": 0.1617, "lr": 1.8874596280209378e-05, "epoch": 0.7550952221850986, "percentage": 3.78, "elapsed_time": "0:41:07", "remaining_time": "17:27:58", "throughput": 3349.04, "total_tokens": 8262464} +{"current_steps": 6785, "total_steps": 179580, "loss": 0.2781, "lr": 1.8888517652299812e-05, "epoch": 0.7556520770687158, "percentage": 3.78, "elapsed_time": "0:41:08", "remaining_time": "17:27:57", "throughput": 3349.04, "total_tokens": 8268672} +{"current_steps": 6790, "total_steps": 179580, "loss": 0.2987, "lr": 1.8902439024390246e-05, "epoch": 0.7562089319523332, "percentage": 3.78, "elapsed_time": "0:41:10", "remaining_time": "17:27:54", "throughput": 3349.03, "total_tokens": 8274528} +{"current_steps": 6795, "total_steps": 179580, "loss": 0.2154, "lr": 1.8916360396480677e-05, "epoch": 0.7567657868359505, "percentage": 3.78, "elapsed_time": "0:41:12", "remaining_time": "17:27:52", "throughput": 3349.08, "total_tokens": 8280736} +{"current_steps": 6800, "total_steps": 179580, "loss": 0.2794, "lr": 1.8930281768571112e-05, "epoch": 0.7573226417195679, "percentage": 3.79, "elapsed_time": "0:41:14", "remaining_time": "17:27:47", "throughput": 3349.08, "total_tokens": 8286368} +{"current_steps": 6805, "total_steps": 179580, "loss": 0.1468, "lr": 1.8944203140661546e-05, "epoch": 0.7578794966031852, "percentage": 3.79, "elapsed_time": "0:41:16", "remaining_time": "17:27:45", "throughput": 3349.1, "total_tokens": 8292480} +{"current_steps": 6810, "total_steps": 179580, "loss": 0.16, "lr": 1.895812451275198e-05, "epoch": 0.7584363514868026, "percentage": 3.79, "elapsed_time": "0:41:17", "remaining_time": "17:27:42", "throughput": 3349.09, "total_tokens": 8298528} +{"current_steps": 6815, "total_steps": 179580, "loss": 0.1357, "lr": 1.897204588484241e-05, "epoch": 0.7589932063704199, "percentage": 3.79, "elapsed_time": "0:41:19", "remaining_time": "17:27:39", "throughput": 3349.1, "total_tokens": 8304416} +{"current_steps": 6820, "total_steps": 179580, "loss": 0.1165, "lr": 1.8985967256932842e-05, "epoch": 0.7595500612540372, "percentage": 3.8, "elapsed_time": "0:41:21", "remaining_time": "17:27:36", "throughput": 3349.11, "total_tokens": 8310432} +{"current_steps": 6825, "total_steps": 179580, "loss": 0.2769, "lr": 1.8999888629023277e-05, "epoch": 0.7601069161376546, "percentage": 3.8, "elapsed_time": "0:41:23", "remaining_time": "17:27:32", "throughput": 3349.07, "total_tokens": 8316096} +{"current_steps": 6830, "total_steps": 179580, "loss": 0.2653, "lr": 1.901381000111371e-05, "epoch": 0.7606637710212718, "percentage": 3.8, "elapsed_time": "0:41:24", "remaining_time": "17:27:32", "throughput": 3349.1, "total_tokens": 8322432} +{"current_steps": 6835, "total_steps": 179580, "loss": 0.0979, "lr": 1.9027731373204145e-05, "epoch": 0.7612206259048891, "percentage": 3.81, "elapsed_time": "0:41:26", "remaining_time": "17:27:30", "throughput": 3349.11, "total_tokens": 8328640} +{"current_steps": 6840, "total_steps": 179580, "loss": 0.1586, "lr": 1.9041652745294576e-05, "epoch": 0.7617774807885065, "percentage": 3.81, "elapsed_time": "0:41:28", "remaining_time": "17:27:28", "throughput": 3349.13, "total_tokens": 8334752} +{"current_steps": 6845, "total_steps": 179580, "loss": 0.2888, "lr": 1.905557411738501e-05, "epoch": 0.7623343356721238, "percentage": 3.81, "elapsed_time": "0:41:30", "remaining_time": "17:27:26", "throughput": 3349.13, "total_tokens": 8340800} +{"current_steps": 6850, "total_steps": 179580, "loss": 0.1739, "lr": 1.9069495489475445e-05, "epoch": 0.7628911905557412, "percentage": 3.81, "elapsed_time": "0:41:32", "remaining_time": "17:27:22", "throughput": 3349.07, "total_tokens": 8346464} +{"current_steps": 6855, "total_steps": 179580, "loss": 0.1396, "lr": 1.908341686156588e-05, "epoch": 0.7634480454393585, "percentage": 3.82, "elapsed_time": "0:41:33", "remaining_time": "17:27:18", "throughput": 3349.06, "total_tokens": 8352224} +{"current_steps": 6860, "total_steps": 179580, "loss": 0.2171, "lr": 1.909733823365631e-05, "epoch": 0.7640049003229759, "percentage": 3.82, "elapsed_time": "0:41:35", "remaining_time": "17:27:16", "throughput": 3349.07, "total_tokens": 8358304} +{"current_steps": 6865, "total_steps": 179580, "loss": 0.162, "lr": 1.911125960574674e-05, "epoch": 0.7645617552065932, "percentage": 3.82, "elapsed_time": "0:41:37", "remaining_time": "17:27:14", "throughput": 3349.08, "total_tokens": 8364384} +{"current_steps": 6870, "total_steps": 179580, "loss": 0.2074, "lr": 1.9125180977837175e-05, "epoch": 0.7651186100902105, "percentage": 3.83, "elapsed_time": "0:41:39", "remaining_time": "17:27:10", "throughput": 3349.04, "total_tokens": 8370112} +{"current_steps": 6875, "total_steps": 179580, "loss": 0.2524, "lr": 1.913910234992761e-05, "epoch": 0.7656754649738278, "percentage": 3.83, "elapsed_time": "0:41:41", "remaining_time": "17:27:10", "throughput": 3349.04, "total_tokens": 8376384} +{"current_steps": 6880, "total_steps": 179580, "loss": 0.2413, "lr": 1.9153023722018044e-05, "epoch": 0.7662323198574451, "percentage": 3.83, "elapsed_time": "0:41:42", "remaining_time": "17:27:07", "throughput": 3349.03, "total_tokens": 8382304} +{"current_steps": 6885, "total_steps": 179580, "loss": 0.0735, "lr": 1.9166945094108475e-05, "epoch": 0.7667891747410625, "percentage": 3.83, "elapsed_time": "0:41:44", "remaining_time": "17:27:05", "throughput": 3349.03, "total_tokens": 8388448} +{"current_steps": 6890, "total_steps": 179580, "loss": 0.3039, "lr": 1.918086646619891e-05, "epoch": 0.7673460296246798, "percentage": 3.84, "elapsed_time": "0:41:46", "remaining_time": "17:27:04", "throughput": 3349.02, "total_tokens": 8394560} +{"current_steps": 6895, "total_steps": 179580, "loss": 0.2664, "lr": 1.9194787838289344e-05, "epoch": 0.7679028845082971, "percentage": 3.84, "elapsed_time": "0:41:48", "remaining_time": "17:26:58", "throughput": 3349.01, "total_tokens": 8400032} +{"current_steps": 6900, "total_steps": 179580, "loss": 0.1136, "lr": 1.9208709210379778e-05, "epoch": 0.7684597393919145, "percentage": 3.84, "elapsed_time": "0:41:50", "remaining_time": "17:26:55", "throughput": 3349.01, "total_tokens": 8406080} +{"current_steps": 6905, "total_steps": 179580, "loss": 0.1186, "lr": 1.922263058247021e-05, "epoch": 0.7690165942755318, "percentage": 3.85, "elapsed_time": "0:41:52", "remaining_time": "17:26:58", "throughput": 3348.79, "total_tokens": 8412256} +{"current_steps": 6910, "total_steps": 179580, "loss": 0.1547, "lr": 1.923655195456064e-05, "epoch": 0.7695734491591492, "percentage": 3.85, "elapsed_time": "0:41:53", "remaining_time": "17:26:56", "throughput": 3348.78, "total_tokens": 8418272} +{"current_steps": 6915, "total_steps": 179580, "loss": 0.3193, "lr": 1.9250473326651074e-05, "epoch": 0.7701303040427665, "percentage": 3.85, "elapsed_time": "0:41:55", "remaining_time": "17:26:52", "throughput": 3348.77, "total_tokens": 8424064} +{"current_steps": 6920, "total_steps": 179580, "loss": 0.1761, "lr": 1.926439469874151e-05, "epoch": 0.7706871589263837, "percentage": 3.85, "elapsed_time": "0:41:57", "remaining_time": "17:26:51", "throughput": 3348.76, "total_tokens": 8430208} +{"current_steps": 6925, "total_steps": 179580, "loss": 0.1573, "lr": 1.9278316070831943e-05, "epoch": 0.7712440138100011, "percentage": 3.86, "elapsed_time": "0:41:59", "remaining_time": "17:26:48", "throughput": 3348.73, "total_tokens": 8436064} +{"current_steps": 6930, "total_steps": 179580, "loss": 0.2985, "lr": 1.9292237442922377e-05, "epoch": 0.7718008686936184, "percentage": 3.86, "elapsed_time": "0:42:00", "remaining_time": "17:26:45", "throughput": 3348.73, "total_tokens": 8441984} +{"current_steps": 6935, "total_steps": 179580, "loss": 0.1246, "lr": 1.9306158815012808e-05, "epoch": 0.7723577235772358, "percentage": 3.86, "elapsed_time": "0:42:02", "remaining_time": "17:26:44", "throughput": 3348.74, "total_tokens": 8448256} +{"current_steps": 6940, "total_steps": 179580, "loss": 0.129, "lr": 1.9320080187103242e-05, "epoch": 0.7729145784608531, "percentage": 3.86, "elapsed_time": "0:42:04", "remaining_time": "17:26:43", "throughput": 3348.75, "total_tokens": 8454432} +{"current_steps": 6945, "total_steps": 179580, "loss": 0.1258, "lr": 1.9334001559193677e-05, "epoch": 0.7734714333444704, "percentage": 3.87, "elapsed_time": "0:42:06", "remaining_time": "17:26:39", "throughput": 3348.73, "total_tokens": 8460192} +{"current_steps": 6950, "total_steps": 179580, "loss": 0.1882, "lr": 1.9347922931284108e-05, "epoch": 0.7740282882280878, "percentage": 3.87, "elapsed_time": "0:42:08", "remaining_time": "17:26:38", "throughput": 3348.75, "total_tokens": 8466432} +{"current_steps": 6955, "total_steps": 179580, "loss": 0.1323, "lr": 1.9361844303374542e-05, "epoch": 0.7745851431117051, "percentage": 3.87, "elapsed_time": "0:42:10", "remaining_time": "17:26:37", "throughput": 3348.76, "total_tokens": 8472704} +{"current_steps": 6960, "total_steps": 179580, "loss": 0.0913, "lr": 1.9375765675464973e-05, "epoch": 0.7751419979953225, "percentage": 3.88, "elapsed_time": "0:42:11", "remaining_time": "17:26:34", "throughput": 3348.76, "total_tokens": 8478656} +{"current_steps": 6965, "total_steps": 179580, "loss": 0.3371, "lr": 1.9389687047555407e-05, "epoch": 0.7756988528789397, "percentage": 3.88, "elapsed_time": "0:42:13", "remaining_time": "17:26:33", "throughput": 3348.77, "total_tokens": 8484832} +{"current_steps": 6970, "total_steps": 179580, "loss": 0.1026, "lr": 1.940360841964584e-05, "epoch": 0.776255707762557, "percentage": 3.88, "elapsed_time": "0:42:15", "remaining_time": "17:26:31", "throughput": 3348.79, "total_tokens": 8490880} +{"current_steps": 6975, "total_steps": 179580, "loss": 0.2832, "lr": 1.9417529791736276e-05, "epoch": 0.7768125626461744, "percentage": 3.88, "elapsed_time": "0:42:17", "remaining_time": "17:26:29", "throughput": 3348.79, "total_tokens": 8496992} +{"current_steps": 6980, "total_steps": 179580, "loss": 0.2018, "lr": 1.9431451163826707e-05, "epoch": 0.7773694175297917, "percentage": 3.89, "elapsed_time": "0:42:19", "remaining_time": "17:26:28", "throughput": 3348.78, "total_tokens": 8503200} +{"current_steps": 6985, "total_steps": 179580, "loss": 0.241, "lr": 1.944537253591714e-05, "epoch": 0.7779262724134091, "percentage": 3.89, "elapsed_time": "0:42:21", "remaining_time": "17:26:28", "throughput": 3348.8, "total_tokens": 8509504} +{"current_steps": 6990, "total_steps": 179580, "loss": 0.2594, "lr": 1.9459293908007576e-05, "epoch": 0.7784831272970264, "percentage": 3.89, "elapsed_time": "0:42:22", "remaining_time": "17:26:28", "throughput": 3348.84, "total_tokens": 8516000} +{"current_steps": 6995, "total_steps": 179580, "loss": 0.3243, "lr": 1.9473215280098006e-05, "epoch": 0.7790399821806437, "percentage": 3.9, "elapsed_time": "0:42:24", "remaining_time": "17:26:27", "throughput": 3348.85, "total_tokens": 8522272} +{"current_steps": 7000, "total_steps": 179580, "loss": 0.157, "lr": 1.948713665218844e-05, "epoch": 0.7795968370642611, "percentage": 3.9, "elapsed_time": "0:42:26", "remaining_time": "17:26:23", "throughput": 3348.85, "total_tokens": 8528000} +{"current_steps": 7005, "total_steps": 179580, "loss": 0.0936, "lr": 1.9501058024278872e-05, "epoch": 0.7801536919478784, "percentage": 3.9, "elapsed_time": "0:42:28", "remaining_time": "17:26:19", "throughput": 3348.85, "total_tokens": 8533792} +{"current_steps": 7010, "total_steps": 179580, "loss": 0.1857, "lr": 1.9514979396369306e-05, "epoch": 0.7807105468314958, "percentage": 3.9, "elapsed_time": "0:42:30", "remaining_time": "17:26:21", "throughput": 3348.89, "total_tokens": 8540480} +{"current_steps": 7015, "total_steps": 179580, "loss": 0.338, "lr": 1.952890076845974e-05, "epoch": 0.781267401715113, "percentage": 3.91, "elapsed_time": "0:42:32", "remaining_time": "17:26:19", "throughput": 3348.91, "total_tokens": 8546592} +{"current_steps": 7020, "total_steps": 179580, "loss": 0.2258, "lr": 1.9542822140550175e-05, "epoch": 0.7818242565987303, "percentage": 3.91, "elapsed_time": "0:42:33", "remaining_time": "17:26:16", "throughput": 3348.91, "total_tokens": 8552576} +{"current_steps": 7025, "total_steps": 179580, "loss": 0.2772, "lr": 1.9556743512640606e-05, "epoch": 0.7823811114823477, "percentage": 3.91, "elapsed_time": "0:42:35", "remaining_time": "17:26:14", "throughput": 3348.92, "total_tokens": 8558656} +{"current_steps": 7030, "total_steps": 179580, "loss": 0.2256, "lr": 1.957066488473104e-05, "epoch": 0.782937966365965, "percentage": 3.91, "elapsed_time": "0:42:37", "remaining_time": "17:26:12", "throughput": 3348.93, "total_tokens": 8564736} +{"current_steps": 7035, "total_steps": 179580, "loss": 0.1622, "lr": 1.9584586256821474e-05, "epoch": 0.7834948212495824, "percentage": 3.92, "elapsed_time": "0:42:39", "remaining_time": "17:26:11", "throughput": 3348.92, "total_tokens": 8571008} +{"current_steps": 7040, "total_steps": 179580, "loss": 0.1717, "lr": 1.9598507628911905e-05, "epoch": 0.7840516761331997, "percentage": 3.92, "elapsed_time": "0:42:41", "remaining_time": "17:26:10", "throughput": 3348.96, "total_tokens": 8577312} +{"current_steps": 7045, "total_steps": 179580, "loss": 0.1853, "lr": 1.961242900100234e-05, "epoch": 0.784608531016817, "percentage": 3.92, "elapsed_time": "0:42:43", "remaining_time": "17:26:10", "throughput": 3348.98, "total_tokens": 8583616} +{"current_steps": 7050, "total_steps": 179580, "loss": 0.2177, "lr": 1.962635037309277e-05, "epoch": 0.7851653859004344, "percentage": 3.93, "elapsed_time": "0:42:44", "remaining_time": "17:26:07", "throughput": 3348.97, "total_tokens": 8589536} +{"current_steps": 7055, "total_steps": 179580, "loss": 0.2142, "lr": 1.9640271745183205e-05, "epoch": 0.7857222407840517, "percentage": 3.93, "elapsed_time": "0:42:46", "remaining_time": "17:26:04", "throughput": 3348.93, "total_tokens": 8595424} +{"current_steps": 7060, "total_steps": 179580, "loss": 0.2405, "lr": 1.965419311727364e-05, "epoch": 0.786279095667669, "percentage": 3.93, "elapsed_time": "0:42:48", "remaining_time": "17:26:02", "throughput": 3348.88, "total_tokens": 8601280} +{"current_steps": 7065, "total_steps": 179580, "loss": 0.2006, "lr": 1.9668114489364074e-05, "epoch": 0.7868359505512863, "percentage": 3.93, "elapsed_time": "0:42:50", "remaining_time": "17:26:00", "throughput": 3348.88, "total_tokens": 8607424} +{"current_steps": 7070, "total_steps": 179580, "loss": 0.1396, "lr": 1.9682035861454508e-05, "epoch": 0.7873928054349036, "percentage": 3.94, "elapsed_time": "0:42:52", "remaining_time": "17:25:58", "throughput": 3348.91, "total_tokens": 8613568} +{"current_steps": 7075, "total_steps": 179580, "loss": 0.1282, "lr": 1.969595723354494e-05, "epoch": 0.787949660318521, "percentage": 3.94, "elapsed_time": "0:42:53", "remaining_time": "17:25:56", "throughput": 3348.88, "total_tokens": 8619520} +{"current_steps": 7080, "total_steps": 179580, "loss": 0.0968, "lr": 1.9709878605635373e-05, "epoch": 0.7885065152021383, "percentage": 3.94, "elapsed_time": "0:42:55", "remaining_time": "17:25:56", "throughput": 3348.86, "total_tokens": 8625792} +{"current_steps": 7085, "total_steps": 179580, "loss": 0.1621, "lr": 1.9723799977725804e-05, "epoch": 0.7890633700857557, "percentage": 3.95, "elapsed_time": "0:42:57", "remaining_time": "17:25:55", "throughput": 3348.9, "total_tokens": 8632160} +{"current_steps": 7090, "total_steps": 179580, "loss": 0.2742, "lr": 1.973772134981624e-05, "epoch": 0.789620224969373, "percentage": 3.95, "elapsed_time": "0:42:59", "remaining_time": "17:25:55", "throughput": 3348.91, "total_tokens": 8638432} +{"current_steps": 7095, "total_steps": 179580, "loss": 0.1814, "lr": 1.9751642721906673e-05, "epoch": 0.7901770798529903, "percentage": 3.95, "elapsed_time": "0:43:01", "remaining_time": "17:25:49", "throughput": 3348.91, "total_tokens": 8643936} +{"current_steps": 7100, "total_steps": 179580, "loss": 0.2169, "lr": 1.9765564093997104e-05, "epoch": 0.7907339347366077, "percentage": 3.95, "elapsed_time": "0:43:02", "remaining_time": "17:25:46", "throughput": 3348.91, "total_tokens": 8649952} +{"current_steps": 7105, "total_steps": 179580, "loss": 0.1238, "lr": 1.9779485466087538e-05, "epoch": 0.7912907896202249, "percentage": 3.96, "elapsed_time": "0:43:04", "remaining_time": "17:25:45", "throughput": 3348.88, "total_tokens": 8656000} +{"current_steps": 7110, "total_steps": 179580, "loss": 0.1691, "lr": 1.9793406838177972e-05, "epoch": 0.7918476445038423, "percentage": 3.96, "elapsed_time": "0:43:06", "remaining_time": "17:25:44", "throughput": 3348.9, "total_tokens": 8662304} +{"current_steps": 7115, "total_steps": 179580, "loss": 0.2291, "lr": 1.9807328210268407e-05, "epoch": 0.7924044993874596, "percentage": 3.96, "elapsed_time": "0:43:08", "remaining_time": "17:25:44", "throughput": 3348.91, "total_tokens": 8668736} +{"current_steps": 7120, "total_steps": 179580, "loss": 0.1388, "lr": 1.9821249582358838e-05, "epoch": 0.792961354271077, "percentage": 3.96, "elapsed_time": "0:43:10", "remaining_time": "17:25:44", "throughput": 3348.92, "total_tokens": 8675008} +{"current_steps": 7125, "total_steps": 179580, "loss": 0.1255, "lr": 1.9835170954449272e-05, "epoch": 0.7935182091546943, "percentage": 3.97, "elapsed_time": "0:43:12", "remaining_time": "17:25:41", "throughput": 3348.92, "total_tokens": 8680960} +{"current_steps": 7130, "total_steps": 179580, "loss": 0.236, "lr": 1.9849092326539706e-05, "epoch": 0.7940750640383116, "percentage": 3.97, "elapsed_time": "0:43:14", "remaining_time": "17:25:40", "throughput": 3348.9, "total_tokens": 8687136} +{"current_steps": 7135, "total_steps": 179580, "loss": 0.3053, "lr": 1.9863013698630137e-05, "epoch": 0.794631918921929, "percentage": 3.97, "elapsed_time": "0:43:15", "remaining_time": "17:25:37", "throughput": 3348.91, "total_tokens": 8693120} +{"current_steps": 7140, "total_steps": 179580, "loss": 0.1594, "lr": 1.987693507072057e-05, "epoch": 0.7951887738055463, "percentage": 3.98, "elapsed_time": "0:43:17", "remaining_time": "17:25:36", "throughput": 3348.92, "total_tokens": 8699296} +{"current_steps": 7145, "total_steps": 179580, "loss": 0.2144, "lr": 1.9890856442811002e-05, "epoch": 0.7957456286891637, "percentage": 3.98, "elapsed_time": "0:43:19", "remaining_time": "17:25:33", "throughput": 3348.89, "total_tokens": 8705184} +{"current_steps": 7150, "total_steps": 179580, "loss": 0.2448, "lr": 1.9904777814901437e-05, "epoch": 0.7963024835727809, "percentage": 3.98, "elapsed_time": "0:43:21", "remaining_time": "17:25:31", "throughput": 3348.89, "total_tokens": 8711232} +{"current_steps": 7155, "total_steps": 179580, "loss": 0.1454, "lr": 1.991869918699187e-05, "epoch": 0.7968593384563982, "percentage": 3.98, "elapsed_time": "0:43:23", "remaining_time": "17:25:29", "throughput": 3348.86, "total_tokens": 8717184} +{"current_steps": 7160, "total_steps": 179580, "loss": 0.2974, "lr": 1.9932620559082305e-05, "epoch": 0.7974161933400156, "percentage": 3.99, "elapsed_time": "0:43:24", "remaining_time": "17:25:27", "throughput": 3348.9, "total_tokens": 8723360} +{"current_steps": 7165, "total_steps": 179580, "loss": 0.1301, "lr": 1.9946541931172736e-05, "epoch": 0.7979730482236329, "percentage": 3.99, "elapsed_time": "0:43:26", "remaining_time": "17:25:25", "throughput": 3348.89, "total_tokens": 8729472} +{"current_steps": 7170, "total_steps": 179580, "loss": 0.3452, "lr": 1.996046330326317e-05, "epoch": 0.7985299031072502, "percentage": 3.99, "elapsed_time": "0:43:28", "remaining_time": "17:25:19", "throughput": 3348.88, "total_tokens": 8734944} +{"current_steps": 7175, "total_steps": 179580, "loss": 0.1414, "lr": 1.9974384675353605e-05, "epoch": 0.7990867579908676, "percentage": 4.0, "elapsed_time": "0:43:30", "remaining_time": "17:25:17", "throughput": 3348.92, "total_tokens": 8741056} +{"current_steps": 7180, "total_steps": 179580, "loss": 0.2889, "lr": 1.9988306047444036e-05, "epoch": 0.7996436128744849, "percentage": 4.0, "elapsed_time": "0:43:31", "remaining_time": "17:25:15", "throughput": 3348.9, "total_tokens": 8747040} +{"current_steps": 7185, "total_steps": 179580, "loss": 0.1608, "lr": 2.000222741953447e-05, "epoch": 0.8002004677581023, "percentage": 4.0, "elapsed_time": "0:43:33", "remaining_time": "17:25:14", "throughput": 3348.9, "total_tokens": 8753280} +{"current_steps": 7190, "total_steps": 179580, "loss": 0.1914, "lr": 2.0016148791624905e-05, "epoch": 0.8007573226417196, "percentage": 4.0, "elapsed_time": "0:43:35", "remaining_time": "17:25:13", "throughput": 3348.93, "total_tokens": 8759552} +{"current_steps": 7195, "total_steps": 179580, "loss": 0.3664, "lr": 2.0030070163715336e-05, "epoch": 0.8013141775253368, "percentage": 4.01, "elapsed_time": "0:43:37", "remaining_time": "17:25:12", "throughput": 3348.92, "total_tokens": 8765760} +{"current_steps": 7200, "total_steps": 179580, "loss": 0.311, "lr": 2.004399153580577e-05, "epoch": 0.8018710324089542, "percentage": 4.01, "elapsed_time": "0:43:39", "remaining_time": "17:25:10", "throughput": 3348.91, "total_tokens": 8771776} +{"current_steps": 7205, "total_steps": 179580, "loss": 0.1665, "lr": 2.0057912907896204e-05, "epoch": 0.8024278872925715, "percentage": 4.01, "elapsed_time": "0:43:41", "remaining_time": "17:25:09", "throughput": 3348.95, "total_tokens": 8778144} +{"current_steps": 7210, "total_steps": 179580, "loss": 0.0615, "lr": 2.007183427998664e-05, "epoch": 0.8029847421761889, "percentage": 4.01, "elapsed_time": "0:43:42", "remaining_time": "17:25:07", "throughput": 3348.94, "total_tokens": 8784160} +{"current_steps": 7215, "total_steps": 179580, "loss": 0.2004, "lr": 2.008575565207707e-05, "epoch": 0.8035415970598062, "percentage": 4.02, "elapsed_time": "0:43:44", "remaining_time": "17:25:05", "throughput": 3348.93, "total_tokens": 8790176} +{"current_steps": 7220, "total_steps": 179580, "loss": 0.2365, "lr": 2.0099677024167504e-05, "epoch": 0.8040984519434236, "percentage": 4.02, "elapsed_time": "0:43:46", "remaining_time": "17:25:04", "throughput": 3348.96, "total_tokens": 8796448} +{"current_steps": 7225, "total_steps": 179580, "loss": 0.1044, "lr": 2.0113598396257935e-05, "epoch": 0.8046553068270409, "percentage": 4.02, "elapsed_time": "0:43:48", "remaining_time": "17:25:02", "throughput": 3348.95, "total_tokens": 8802560} +{"current_steps": 7230, "total_steps": 179580, "loss": 0.0781, "lr": 2.012751976834837e-05, "epoch": 0.8052121617106582, "percentage": 4.03, "elapsed_time": "0:43:50", "remaining_time": "17:25:00", "throughput": 3348.95, "total_tokens": 8808608} +{"current_steps": 7235, "total_steps": 179580, "loss": 0.202, "lr": 2.0141441140438803e-05, "epoch": 0.8057690165942756, "percentage": 4.03, "elapsed_time": "0:43:52", "remaining_time": "17:24:57", "throughput": 3348.89, "total_tokens": 8814304} +{"current_steps": 7240, "total_steps": 179580, "loss": 0.0809, "lr": 2.0155362512529234e-05, "epoch": 0.8063258714778928, "percentage": 4.03, "elapsed_time": "0:43:53", "remaining_time": "17:24:54", "throughput": 3348.9, "total_tokens": 8820384} +{"current_steps": 7245, "total_steps": 179580, "loss": 0.3742, "lr": 2.016928388461967e-05, "epoch": 0.8068827263615101, "percentage": 4.03, "elapsed_time": "0:43:55", "remaining_time": "17:24:52", "throughput": 3348.92, "total_tokens": 8826368} +{"current_steps": 7250, "total_steps": 179580, "loss": 0.2364, "lr": 2.0183205256710103e-05, "epoch": 0.8074395812451275, "percentage": 4.04, "elapsed_time": "0:43:57", "remaining_time": "17:24:50", "throughput": 3348.9, "total_tokens": 8832384} +{"current_steps": 7255, "total_steps": 179580, "loss": 0.12, "lr": 2.0197126628800537e-05, "epoch": 0.8079964361287448, "percentage": 4.04, "elapsed_time": "0:43:59", "remaining_time": "17:24:47", "throughput": 3348.91, "total_tokens": 8838464} +{"current_steps": 7260, "total_steps": 179580, "loss": 0.1667, "lr": 2.0211048000890968e-05, "epoch": 0.8085532910123622, "percentage": 4.04, "elapsed_time": "0:44:00", "remaining_time": "17:24:42", "throughput": 3348.88, "total_tokens": 8844032} +{"current_steps": 7265, "total_steps": 179580, "loss": 0.1763, "lr": 2.0224969372981403e-05, "epoch": 0.8091101458959795, "percentage": 4.05, "elapsed_time": "0:44:02", "remaining_time": "17:24:42", "throughput": 3348.86, "total_tokens": 8850272} +{"current_steps": 7270, "total_steps": 179580, "loss": 0.1179, "lr": 2.0238890745071834e-05, "epoch": 0.8096670007795969, "percentage": 4.05, "elapsed_time": "0:44:04", "remaining_time": "17:24:37", "throughput": 3348.87, "total_tokens": 8855936} +{"current_steps": 7275, "total_steps": 179580, "loss": 0.2935, "lr": 2.0252812117162268e-05, "epoch": 0.8102238556632142, "percentage": 4.05, "elapsed_time": "0:44:06", "remaining_time": "17:24:37", "throughput": 3348.89, "total_tokens": 8862272} +{"current_steps": 7280, "total_steps": 179580, "loss": 0.2535, "lr": 2.0266733489252702e-05, "epoch": 0.8107807105468315, "percentage": 4.05, "elapsed_time": "0:44:08", "remaining_time": "17:24:35", "throughput": 3348.9, "total_tokens": 8868416} +{"current_steps": 7285, "total_steps": 179580, "loss": 0.228, "lr": 2.0280654861343133e-05, "epoch": 0.8113375654304488, "percentage": 4.06, "elapsed_time": "0:44:09", "remaining_time": "17:24:33", "throughput": 3348.9, "total_tokens": 8874496} +{"current_steps": 7290, "total_steps": 179580, "loss": 0.1612, "lr": 2.0294576233433567e-05, "epoch": 0.8118944203140661, "percentage": 4.06, "elapsed_time": "0:44:11", "remaining_time": "17:24:32", "throughput": 3348.89, "total_tokens": 8880672} +{"current_steps": 7295, "total_steps": 179580, "loss": 0.3092, "lr": 2.0308497605524002e-05, "epoch": 0.8124512751976835, "percentage": 4.06, "elapsed_time": "0:44:13", "remaining_time": "17:24:30", "throughput": 3348.85, "total_tokens": 8886656} +{"current_steps": 7300, "total_steps": 179580, "loss": 0.1386, "lr": 2.0322418977614436e-05, "epoch": 0.8130081300813008, "percentage": 4.07, "elapsed_time": "0:44:15", "remaining_time": "17:24:28", "throughput": 3348.85, "total_tokens": 8892640} +{"current_steps": 7305, "total_steps": 179580, "loss": 0.2097, "lr": 2.033634034970487e-05, "epoch": 0.8135649849649181, "percentage": 4.07, "elapsed_time": "0:44:17", "remaining_time": "17:24:26", "throughput": 3348.87, "total_tokens": 8898816} +{"current_steps": 7310, "total_steps": 179580, "loss": 0.1531, "lr": 2.03502617217953e-05, "epoch": 0.8141218398485355, "percentage": 4.07, "elapsed_time": "0:44:19", "remaining_time": "17:24:24", "throughput": 3348.84, "total_tokens": 8904736} +{"current_steps": 7315, "total_steps": 179580, "loss": 0.2184, "lr": 2.0364183093885732e-05, "epoch": 0.8146786947321528, "percentage": 4.07, "elapsed_time": "0:44:20", "remaining_time": "17:24:21", "throughput": 3348.84, "total_tokens": 8910688} +{"current_steps": 7320, "total_steps": 179580, "loss": 0.1561, "lr": 2.0378104465976167e-05, "epoch": 0.8152355496157702, "percentage": 4.08, "elapsed_time": "0:44:22", "remaining_time": "17:24:20", "throughput": 3348.86, "total_tokens": 8916992} +{"current_steps": 7325, "total_steps": 179580, "loss": 0.1486, "lr": 2.03920258380666e-05, "epoch": 0.8157924044993875, "percentage": 4.08, "elapsed_time": "0:44:24", "remaining_time": "17:24:13", "throughput": 3348.82, "total_tokens": 8922240} +{"current_steps": 7330, "total_steps": 179580, "loss": 0.2212, "lr": 2.0405947210157035e-05, "epoch": 0.8163492593830048, "percentage": 4.08, "elapsed_time": "0:44:26", "remaining_time": "17:24:09", "throughput": 3348.83, "total_tokens": 8928000} +{"current_steps": 7335, "total_steps": 179580, "loss": 0.2771, "lr": 2.0419868582247466e-05, "epoch": 0.8169061142666221, "percentage": 4.08, "elapsed_time": "0:44:27", "remaining_time": "17:24:06", "throughput": 3348.84, "total_tokens": 8934016} +{"current_steps": 7340, "total_steps": 179580, "loss": 0.3886, "lr": 2.04337899543379e-05, "epoch": 0.8174629691502394, "percentage": 4.09, "elapsed_time": "0:44:29", "remaining_time": "17:24:05", "throughput": 3348.86, "total_tokens": 8940192} +{"current_steps": 7345, "total_steps": 179580, "loss": 0.2112, "lr": 2.0447711326428335e-05, "epoch": 0.8180198240338568, "percentage": 4.09, "elapsed_time": "0:44:31", "remaining_time": "17:24:05", "throughput": 3348.88, "total_tokens": 8946592} +{"current_steps": 7350, "total_steps": 179580, "loss": 0.2207, "lr": 2.046163269851877e-05, "epoch": 0.8185766789174741, "percentage": 4.09, "elapsed_time": "0:44:33", "remaining_time": "17:24:02", "throughput": 3348.86, "total_tokens": 8952448} +{"current_steps": 7355, "total_steps": 179580, "loss": 0.2625, "lr": 2.04755540706092e-05, "epoch": 0.8191335338010914, "percentage": 4.1, "elapsed_time": "0:44:35", "remaining_time": "17:23:58", "throughput": 3348.87, "total_tokens": 8958336} +{"current_steps": 7360, "total_steps": 179580, "loss": 0.1882, "lr": 2.048947544269963e-05, "epoch": 0.8196903886847088, "percentage": 4.1, "elapsed_time": "0:44:36", "remaining_time": "17:23:57", "throughput": 3348.85, "total_tokens": 8964448} +{"current_steps": 7365, "total_steps": 179580, "loss": 0.1898, "lr": 2.0503396814790065e-05, "epoch": 0.8202472435683261, "percentage": 4.1, "elapsed_time": "0:44:38", "remaining_time": "17:23:52", "throughput": 3348.85, "total_tokens": 8970048} +{"current_steps": 7370, "total_steps": 179580, "loss": 0.1083, "lr": 2.05173181868805e-05, "epoch": 0.8208040984519435, "percentage": 4.1, "elapsed_time": "0:44:40", "remaining_time": "17:23:50", "throughput": 3348.76, "total_tokens": 8975968} +{"current_steps": 7375, "total_steps": 179580, "loss": 0.1673, "lr": 2.0531239558970934e-05, "epoch": 0.8213609533355608, "percentage": 4.11, "elapsed_time": "0:44:42", "remaining_time": "17:23:49", "throughput": 3348.79, "total_tokens": 8982240} +{"current_steps": 7380, "total_steps": 179580, "loss": 0.1593, "lr": 2.0545160931061365e-05, "epoch": 0.821917808219178, "percentage": 4.11, "elapsed_time": "0:44:44", "remaining_time": "17:23:47", "throughput": 3348.76, "total_tokens": 8988256} +{"current_steps": 7385, "total_steps": 179580, "loss": 0.2373, "lr": 2.05590823031518e-05, "epoch": 0.8224746631027954, "percentage": 4.11, "elapsed_time": "0:44:45", "remaining_time": "17:23:47", "throughput": 3348.77, "total_tokens": 8994528} +{"current_steps": 7390, "total_steps": 179580, "loss": 0.2565, "lr": 2.0573003675242234e-05, "epoch": 0.8230315179864127, "percentage": 4.12, "elapsed_time": "0:44:47", "remaining_time": "17:23:45", "throughput": 3348.75, "total_tokens": 9000576} +{"current_steps": 7395, "total_steps": 179580, "loss": 0.2172, "lr": 2.0586925047332668e-05, "epoch": 0.8235883728700301, "percentage": 4.12, "elapsed_time": "0:44:49", "remaining_time": "17:23:44", "throughput": 3348.74, "total_tokens": 9006688} +{"current_steps": 7400, "total_steps": 179580, "loss": 0.4001, "lr": 2.06008464194231e-05, "epoch": 0.8241452277536474, "percentage": 4.12, "elapsed_time": "0:44:51", "remaining_time": "17:23:43", "throughput": 3348.73, "total_tokens": 9012864} +{"current_steps": 7405, "total_steps": 179580, "loss": 0.2127, "lr": 2.061476779151353e-05, "epoch": 0.8247020826372647, "percentage": 4.12, "elapsed_time": "0:44:53", "remaining_time": "17:23:41", "throughput": 3348.77, "total_tokens": 9019072} +{"current_steps": 7410, "total_steps": 179580, "loss": 0.097, "lr": 2.0628689163603964e-05, "epoch": 0.8252589375208821, "percentage": 4.13, "elapsed_time": "0:44:55", "remaining_time": "17:23:40", "throughput": 3348.76, "total_tokens": 9025280} +{"current_steps": 7415, "total_steps": 179580, "loss": 0.2799, "lr": 2.06426105356944e-05, "epoch": 0.8258157924044994, "percentage": 4.13, "elapsed_time": "0:44:56", "remaining_time": "17:23:37", "throughput": 3348.78, "total_tokens": 9031200} +{"current_steps": 7420, "total_steps": 179580, "loss": 0.1223, "lr": 2.0656531907784833e-05, "epoch": 0.8263726472881168, "percentage": 4.13, "elapsed_time": "0:44:58", "remaining_time": "17:23:32", "throughput": 3348.73, "total_tokens": 9036704} +{"current_steps": 7425, "total_steps": 179580, "loss": 0.128, "lr": 2.0670453279875264e-05, "epoch": 0.826929502171734, "percentage": 4.13, "elapsed_time": "0:45:00", "remaining_time": "17:23:31", "throughput": 3348.76, "total_tokens": 9043040} +{"current_steps": 7430, "total_steps": 179580, "loss": 0.2697, "lr": 2.0684374651965698e-05, "epoch": 0.8274863570553513, "percentage": 4.14, "elapsed_time": "0:45:02", "remaining_time": "17:23:28", "throughput": 3348.74, "total_tokens": 9048864} +{"current_steps": 7435, "total_steps": 179580, "loss": 0.1074, "lr": 2.0698296024056133e-05, "epoch": 0.8280432119389687, "percentage": 4.14, "elapsed_time": "0:45:04", "remaining_time": "17:23:27", "throughput": 3348.75, "total_tokens": 9055168} +{"current_steps": 7440, "total_steps": 179580, "loss": 0.1686, "lr": 2.0712217396146567e-05, "epoch": 0.828600066822586, "percentage": 4.14, "elapsed_time": "0:45:05", "remaining_time": "17:23:26", "throughput": 3348.76, "total_tokens": 9061312} +{"current_steps": 7445, "total_steps": 179580, "loss": 0.1211, "lr": 2.0726138768237e-05, "epoch": 0.8291569217062034, "percentage": 4.15, "elapsed_time": "0:45:07", "remaining_time": "17:23:24", "throughput": 3348.77, "total_tokens": 9067392} +{"current_steps": 7450, "total_steps": 179580, "loss": 0.0732, "lr": 2.0740060140327432e-05, "epoch": 0.8297137765898207, "percentage": 4.15, "elapsed_time": "0:45:09", "remaining_time": "17:23:22", "throughput": 3348.74, "total_tokens": 9073440} +{"current_steps": 7455, "total_steps": 179580, "loss": 0.208, "lr": 2.0753981512417863e-05, "epoch": 0.830270631473438, "percentage": 4.15, "elapsed_time": "0:45:11", "remaining_time": "17:23:21", "throughput": 3348.73, "total_tokens": 9079616} +{"current_steps": 7460, "total_steps": 179580, "loss": 0.1556, "lr": 2.0767902884508297e-05, "epoch": 0.8308274863570554, "percentage": 4.15, "elapsed_time": "0:45:13", "remaining_time": "17:23:15", "throughput": 3348.72, "total_tokens": 9085120} +{"current_steps": 7465, "total_steps": 179580, "loss": 0.1136, "lr": 2.0781824256598732e-05, "epoch": 0.8313843412406727, "percentage": 4.16, "elapsed_time": "0:45:14", "remaining_time": "17:23:14", "throughput": 3348.73, "total_tokens": 9091360} +{"current_steps": 7470, "total_steps": 179580, "loss": 0.0884, "lr": 2.0795745628689166e-05, "epoch": 0.83194119612429, "percentage": 4.16, "elapsed_time": "0:45:16", "remaining_time": "17:23:12", "throughput": 3348.73, "total_tokens": 9097440} +{"current_steps": 7475, "total_steps": 179580, "loss": 0.1957, "lr": 2.0809667000779597e-05, "epoch": 0.8324980510079073, "percentage": 4.16, "elapsed_time": "0:45:18", "remaining_time": "17:23:11", "throughput": 3348.76, "total_tokens": 9103680} +{"current_steps": 7480, "total_steps": 179580, "loss": 0.2979, "lr": 2.082358837287003e-05, "epoch": 0.8330549058915246, "percentage": 4.17, "elapsed_time": "0:45:20", "remaining_time": "17:23:08", "throughput": 3348.76, "total_tokens": 9109632} +{"current_steps": 7485, "total_steps": 179580, "loss": 0.1764, "lr": 2.0837509744960466e-05, "epoch": 0.833611760775142, "percentage": 4.17, "elapsed_time": "0:45:22", "remaining_time": "17:23:07", "throughput": 3348.75, "total_tokens": 9115712} +{"current_steps": 7490, "total_steps": 179580, "loss": 0.1786, "lr": 2.08514311170509e-05, "epoch": 0.8341686156587593, "percentage": 4.17, "elapsed_time": "0:45:23", "remaining_time": "17:23:06", "throughput": 3348.74, "total_tokens": 9121920} +{"current_steps": 7495, "total_steps": 179580, "loss": 0.2104, "lr": 2.086535248914133e-05, "epoch": 0.8347254705423767, "percentage": 4.17, "elapsed_time": "0:45:25", "remaining_time": "17:23:03", "throughput": 3348.74, "total_tokens": 9127936} +{"current_steps": 7500, "total_steps": 179580, "loss": 0.2645, "lr": 2.0879273861231762e-05, "epoch": 0.835282325425994, "percentage": 4.18, "elapsed_time": "0:45:27", "remaining_time": "17:23:01", "throughput": 3348.73, "total_tokens": 9133952} +{"current_steps": 7505, "total_steps": 179580, "loss": 0.2745, "lr": 2.0893195233322196e-05, "epoch": 0.8358391803096114, "percentage": 4.18, "elapsed_time": "0:45:29", "remaining_time": "17:22:59", "throughput": 3348.74, "total_tokens": 9140032} +{"current_steps": 7510, "total_steps": 179580, "loss": 0.2653, "lr": 2.090711660541263e-05, "epoch": 0.8363960351932287, "percentage": 4.18, "elapsed_time": "0:45:31", "remaining_time": "17:22:54", "throughput": 3348.7, "total_tokens": 9145504} +{"current_steps": 7515, "total_steps": 179580, "loss": 0.2727, "lr": 2.0921037977503065e-05, "epoch": 0.8369528900768459, "percentage": 4.18, "elapsed_time": "0:45:32", "remaining_time": "17:22:53", "throughput": 3348.73, "total_tokens": 9151776} +{"current_steps": 7520, "total_steps": 179580, "loss": 0.2034, "lr": 2.0934959349593496e-05, "epoch": 0.8375097449604633, "percentage": 4.19, "elapsed_time": "0:45:34", "remaining_time": "17:22:53", "throughput": 3348.73, "total_tokens": 9158144} +{"current_steps": 7525, "total_steps": 179580, "loss": 0.3384, "lr": 2.094888072168393e-05, "epoch": 0.8380665998440806, "percentage": 4.19, "elapsed_time": "0:45:36", "remaining_time": "17:22:49", "throughput": 3348.73, "total_tokens": 9164000} +{"current_steps": 7530, "total_steps": 179580, "loss": 0.2383, "lr": 2.0962802093774364e-05, "epoch": 0.838623454727698, "percentage": 4.19, "elapsed_time": "0:45:38", "remaining_time": "17:22:47", "throughput": 3348.72, "total_tokens": 9170016} +{"current_steps": 7535, "total_steps": 179580, "loss": 0.2426, "lr": 2.09767234658648e-05, "epoch": 0.8391803096113153, "percentage": 4.2, "elapsed_time": "0:45:40", "remaining_time": "17:22:46", "throughput": 3348.72, "total_tokens": 9176128} +{"current_steps": 7540, "total_steps": 179580, "loss": 0.271, "lr": 2.099064483795523e-05, "epoch": 0.8397371644949326, "percentage": 4.2, "elapsed_time": "0:45:42", "remaining_time": "17:22:46", "throughput": 3348.72, "total_tokens": 9182464} +{"current_steps": 7545, "total_steps": 179580, "loss": 0.1439, "lr": 2.100456621004566e-05, "epoch": 0.84029401937855, "percentage": 4.2, "elapsed_time": "0:45:43", "remaining_time": "17:22:43", "throughput": 3348.72, "total_tokens": 9188416} +{"current_steps": 7550, "total_steps": 179580, "loss": 0.0776, "lr": 2.1018487582136095e-05, "epoch": 0.8408508742621673, "percentage": 4.2, "elapsed_time": "0:45:45", "remaining_time": "17:22:40", "throughput": 3348.7, "total_tokens": 9194272} +{"current_steps": 7555, "total_steps": 179580, "loss": 0.2866, "lr": 2.103240895422653e-05, "epoch": 0.8414077291457847, "percentage": 4.21, "elapsed_time": "0:45:47", "remaining_time": "17:22:39", "throughput": 3348.68, "total_tokens": 9200416} +{"current_steps": 7560, "total_steps": 179580, "loss": 0.1603, "lr": 2.1046330326316964e-05, "epoch": 0.8419645840294019, "percentage": 4.21, "elapsed_time": "0:45:49", "remaining_time": "17:22:39", "throughput": 3348.69, "total_tokens": 9206880} +{"current_steps": 7565, "total_steps": 179580, "loss": 0.0958, "lr": 2.1060251698407395e-05, "epoch": 0.8425214389130192, "percentage": 4.21, "elapsed_time": "0:45:51", "remaining_time": "17:22:36", "throughput": 3348.72, "total_tokens": 9212864} +{"current_steps": 7570, "total_steps": 179580, "loss": 0.2083, "lr": 2.107417307049783e-05, "epoch": 0.8430782937966366, "percentage": 4.22, "elapsed_time": "0:45:52", "remaining_time": "17:22:25", "throughput": 3348.64, "total_tokens": 9217376} +{"current_steps": 7575, "total_steps": 179580, "loss": 0.2269, "lr": 2.1088094442588263e-05, "epoch": 0.8436351486802539, "percentage": 4.22, "elapsed_time": "0:45:54", "remaining_time": "17:22:21", "throughput": 3348.64, "total_tokens": 9223168} +{"current_steps": 7580, "total_steps": 179580, "loss": 0.3361, "lr": 2.1102015814678698e-05, "epoch": 0.8441920035638713, "percentage": 4.22, "elapsed_time": "0:45:56", "remaining_time": "17:22:19", "throughput": 3348.63, "total_tokens": 9229184} +{"current_steps": 7585, "total_steps": 179580, "loss": 0.1561, "lr": 2.1115937186769132e-05, "epoch": 0.8447488584474886, "percentage": 4.22, "elapsed_time": "0:45:57", "remaining_time": "17:22:17", "throughput": 3348.63, "total_tokens": 9235168} +{"current_steps": 7590, "total_steps": 179580, "loss": 0.1415, "lr": 2.112985855885956e-05, "epoch": 0.8453057133311059, "percentage": 4.23, "elapsed_time": "0:45:59", "remaining_time": "17:22:16", "throughput": 3348.68, "total_tokens": 9241504} +{"current_steps": 7595, "total_steps": 179580, "loss": 0.2274, "lr": 2.1143779930949994e-05, "epoch": 0.8458625682147233, "percentage": 4.23, "elapsed_time": "0:46:01", "remaining_time": "17:22:13", "throughput": 3348.68, "total_tokens": 9247552} +{"current_steps": 7600, "total_steps": 179580, "loss": 0.195, "lr": 2.1157701303040428e-05, "epoch": 0.8464194230983406, "percentage": 4.23, "elapsed_time": "0:46:03", "remaining_time": "17:22:13", "throughput": 3348.71, "total_tokens": 9253888} +{"current_steps": 7605, "total_steps": 179580, "loss": 0.2606, "lr": 2.1171622675130862e-05, "epoch": 0.8469762779819578, "percentage": 4.23, "elapsed_time": "0:46:05", "remaining_time": "17:22:13", "throughput": 3348.71, "total_tokens": 9260256} +{"current_steps": 7610, "total_steps": 179580, "loss": 0.2446, "lr": 2.1185544047221297e-05, "epoch": 0.8475331328655752, "percentage": 4.24, "elapsed_time": "0:46:07", "remaining_time": "17:22:13", "throughput": 3348.73, "total_tokens": 9266656} +{"current_steps": 7615, "total_steps": 179580, "loss": 0.0695, "lr": 2.1199465419311728e-05, "epoch": 0.8480899877491925, "percentage": 4.24, "elapsed_time": "0:46:09", "remaining_time": "17:22:11", "throughput": 3348.72, "total_tokens": 9272768} +{"current_steps": 7620, "total_steps": 179580, "loss": 0.0888, "lr": 2.1213386791402162e-05, "epoch": 0.8486468426328099, "percentage": 4.24, "elapsed_time": "0:46:10", "remaining_time": "17:22:10", "throughput": 3348.71, "total_tokens": 9278880} +{"current_steps": 7625, "total_steps": 179580, "loss": 0.1366, "lr": 2.1227308163492596e-05, "epoch": 0.8492036975164272, "percentage": 4.25, "elapsed_time": "0:46:12", "remaining_time": "17:22:08", "throughput": 3348.7, "total_tokens": 9284896} +{"current_steps": 7630, "total_steps": 179580, "loss": 0.3228, "lr": 2.124122953558303e-05, "epoch": 0.8497605524000446, "percentage": 4.25, "elapsed_time": "0:46:14", "remaining_time": "17:22:04", "throughput": 3348.7, "total_tokens": 9290720} +{"current_steps": 7635, "total_steps": 179580, "loss": 0.1261, "lr": 2.125515090767346e-05, "epoch": 0.8503174072836619, "percentage": 4.25, "elapsed_time": "0:46:16", "remaining_time": "17:22:01", "throughput": 3348.71, "total_tokens": 9296704} +{"current_steps": 7640, "total_steps": 179580, "loss": 0.2429, "lr": 2.1269072279763893e-05, "epoch": 0.8508742621672792, "percentage": 4.25, "elapsed_time": "0:46:18", "remaining_time": "17:22:01", "throughput": 3348.73, "total_tokens": 9303136} +{"current_steps": 7645, "total_steps": 179580, "loss": 0.204, "lr": 2.1282993651854327e-05, "epoch": 0.8514311170508966, "percentage": 4.26, "elapsed_time": "0:46:19", "remaining_time": "17:22:00", "throughput": 3348.64, "total_tokens": 9309024} +{"current_steps": 7650, "total_steps": 179580, "loss": 0.0856, "lr": 2.129691502394476e-05, "epoch": 0.8519879719345138, "percentage": 4.26, "elapsed_time": "0:46:21", "remaining_time": "17:21:58", "throughput": 3348.61, "total_tokens": 9315072} +{"current_steps": 7655, "total_steps": 179580, "loss": 0.1791, "lr": 2.1310836396035196e-05, "epoch": 0.8525448268181312, "percentage": 4.26, "elapsed_time": "0:46:23", "remaining_time": "17:21:57", "throughput": 3348.61, "total_tokens": 9321216} +{"current_steps": 7660, "total_steps": 179580, "loss": 0.1498, "lr": 2.1324757768125626e-05, "epoch": 0.8531016817017485, "percentage": 4.27, "elapsed_time": "0:46:25", "remaining_time": "17:21:55", "throughput": 3348.59, "total_tokens": 9327200} +{"current_steps": 7665, "total_steps": 179580, "loss": 0.2484, "lr": 2.133867914021606e-05, "epoch": 0.8536585365853658, "percentage": 4.27, "elapsed_time": "0:46:27", "remaining_time": "17:21:52", "throughput": 3348.59, "total_tokens": 9333056} +{"current_steps": 7670, "total_steps": 179580, "loss": 0.3066, "lr": 2.1352600512306495e-05, "epoch": 0.8542153914689832, "percentage": 4.27, "elapsed_time": "0:46:29", "remaining_time": "17:21:51", "throughput": 3348.6, "total_tokens": 9339424} +{"current_steps": 7675, "total_steps": 179580, "loss": 0.1595, "lr": 2.136652188439693e-05, "epoch": 0.8547722463526005, "percentage": 4.27, "elapsed_time": "0:46:30", "remaining_time": "17:21:49", "throughput": 3348.58, "total_tokens": 9345376} +{"current_steps": 7680, "total_steps": 179580, "loss": 0.1998, "lr": 2.138044325648736e-05, "epoch": 0.8553291012362179, "percentage": 4.28, "elapsed_time": "0:46:32", "remaining_time": "17:21:49", "throughput": 3348.63, "total_tokens": 9351808} +{"current_steps": 7685, "total_steps": 179580, "loss": 0.1834, "lr": 2.139436462857779e-05, "epoch": 0.8558859561198352, "percentage": 4.28, "elapsed_time": "0:46:34", "remaining_time": "17:21:46", "throughput": 3348.61, "total_tokens": 9357696} +{"current_steps": 7690, "total_steps": 179580, "loss": 0.2438, "lr": 2.1408286000668226e-05, "epoch": 0.8564428110034525, "percentage": 4.28, "elapsed_time": "0:46:36", "remaining_time": "17:21:44", "throughput": 3348.61, "total_tokens": 9363712} +{"current_steps": 7695, "total_steps": 179580, "loss": 0.1457, "lr": 2.142220737275866e-05, "epoch": 0.8569996658870699, "percentage": 4.28, "elapsed_time": "0:46:38", "remaining_time": "17:21:43", "throughput": 3348.59, "total_tokens": 9369888} +{"current_steps": 7700, "total_steps": 179580, "loss": 0.1926, "lr": 2.1436128744849094e-05, "epoch": 0.8575565207706871, "percentage": 4.29, "elapsed_time": "0:46:39", "remaining_time": "17:21:40", "throughput": 3348.57, "total_tokens": 9375840} +{"current_steps": 7705, "total_steps": 179580, "loss": 0.1774, "lr": 2.1450050116939525e-05, "epoch": 0.8581133756543045, "percentage": 4.29, "elapsed_time": "0:46:41", "remaining_time": "17:21:37", "throughput": 3348.52, "total_tokens": 9381600} +{"current_steps": 7710, "total_steps": 179580, "loss": 0.1107, "lr": 2.146397148902996e-05, "epoch": 0.8586702305379218, "percentage": 4.29, "elapsed_time": "0:46:43", "remaining_time": "17:21:37", "throughput": 3348.52, "total_tokens": 9387936} +{"current_steps": 7715, "total_steps": 179580, "loss": 0.2454, "lr": 2.1477892861120394e-05, "epoch": 0.8592270854215391, "percentage": 4.3, "elapsed_time": "0:46:45", "remaining_time": "17:21:35", "throughput": 3348.53, "total_tokens": 9394016} +{"current_steps": 7720, "total_steps": 179580, "loss": 0.0937, "lr": 2.1491814233210828e-05, "epoch": 0.8597839403051565, "percentage": 4.3, "elapsed_time": "0:46:47", "remaining_time": "17:21:32", "throughput": 3348.51, "total_tokens": 9399904} +{"current_steps": 7725, "total_steps": 179580, "loss": 0.2323, "lr": 2.150573560530126e-05, "epoch": 0.8603407951887738, "percentage": 4.3, "elapsed_time": "0:46:49", "remaining_time": "17:21:33", "throughput": 3348.53, "total_tokens": 9406400} +{"current_steps": 7730, "total_steps": 179580, "loss": 0.1312, "lr": 2.151965697739169e-05, "epoch": 0.8608976500723912, "percentage": 4.3, "elapsed_time": "0:46:50", "remaining_time": "17:21:32", "throughput": 3348.56, "total_tokens": 9412768} +{"current_steps": 7735, "total_steps": 179580, "loss": 0.1857, "lr": 2.1533578349482124e-05, "epoch": 0.8614545049560085, "percentage": 4.31, "elapsed_time": "0:46:52", "remaining_time": "17:21:30", "throughput": 3348.55, "total_tokens": 9418752} +{"current_steps": 7740, "total_steps": 179580, "loss": 0.2294, "lr": 2.154749972157256e-05, "epoch": 0.8620113598396258, "percentage": 4.31, "elapsed_time": "0:46:54", "remaining_time": "17:21:25", "throughput": 3348.54, "total_tokens": 9424352} +{"current_steps": 7745, "total_steps": 179580, "loss": 0.1931, "lr": 2.1561421093662993e-05, "epoch": 0.8625682147232431, "percentage": 4.31, "elapsed_time": "0:46:56", "remaining_time": "17:21:23", "throughput": 3348.53, "total_tokens": 9430464} +{"current_steps": 7750, "total_steps": 179580, "loss": 0.2546, "lr": 2.1575342465753427e-05, "epoch": 0.8631250696068604, "percentage": 4.32, "elapsed_time": "0:46:58", "remaining_time": "17:21:21", "throughput": 3348.54, "total_tokens": 9436448} +{"current_steps": 7755, "total_steps": 179580, "loss": 0.1353, "lr": 2.158926383784386e-05, "epoch": 0.8636819244904778, "percentage": 4.32, "elapsed_time": "0:46:59", "remaining_time": "17:21:20", "throughput": 3348.56, "total_tokens": 9442656} +{"current_steps": 7760, "total_steps": 179580, "loss": 0.2065, "lr": 2.1603185209934293e-05, "epoch": 0.8642387793740951, "percentage": 4.32, "elapsed_time": "0:47:01", "remaining_time": "17:21:17", "throughput": 3348.53, "total_tokens": 9448480} +{"current_steps": 7765, "total_steps": 179580, "loss": 0.169, "lr": 2.1617106582024727e-05, "epoch": 0.8647956342577124, "percentage": 4.32, "elapsed_time": "0:47:03", "remaining_time": "17:21:13", "throughput": 3348.55, "total_tokens": 9454336} +{"current_steps": 7770, "total_steps": 179580, "loss": 0.1917, "lr": 2.1631027954115158e-05, "epoch": 0.8653524891413298, "percentage": 4.33, "elapsed_time": "0:47:05", "remaining_time": "17:21:14", "throughput": 3348.57, "total_tokens": 9460896} +{"current_steps": 7775, "total_steps": 179580, "loss": 0.2518, "lr": 2.1644949326205592e-05, "epoch": 0.8659093440249471, "percentage": 4.33, "elapsed_time": "0:47:07", "remaining_time": "17:21:11", "throughput": 3348.52, "total_tokens": 9466688} +{"current_steps": 7780, "total_steps": 179580, "loss": 0.0614, "lr": 2.1658870698296023e-05, "epoch": 0.8664661989085645, "percentage": 4.33, "elapsed_time": "0:47:09", "remaining_time": "17:21:11", "throughput": 3348.52, "total_tokens": 9473024} +{"current_steps": 7785, "total_steps": 179580, "loss": 0.169, "lr": 2.1672792070386458e-05, "epoch": 0.8670230537921818, "percentage": 4.34, "elapsed_time": "0:47:10", "remaining_time": "17:21:09", "throughput": 3348.51, "total_tokens": 9479104} +{"current_steps": 7790, "total_steps": 179580, "loss": 0.203, "lr": 2.1686713442476892e-05, "epoch": 0.867579908675799, "percentage": 4.34, "elapsed_time": "0:47:12", "remaining_time": "17:21:08", "throughput": 3348.55, "total_tokens": 9485504} +{"current_steps": 7795, "total_steps": 179580, "loss": 0.1064, "lr": 2.1700634814567326e-05, "epoch": 0.8681367635594164, "percentage": 4.34, "elapsed_time": "0:47:14", "remaining_time": "17:21:09", "throughput": 3348.56, "total_tokens": 9491968} +{"current_steps": 7800, "total_steps": 179580, "loss": 0.19, "lr": 2.1714556186657757e-05, "epoch": 0.8686936184430337, "percentage": 4.34, "elapsed_time": "0:47:16", "remaining_time": "17:21:06", "throughput": 3348.54, "total_tokens": 9497888} +{"current_steps": 7805, "total_steps": 179580, "loss": 0.2014, "lr": 2.172847755874819e-05, "epoch": 0.8692504733266511, "percentage": 4.35, "elapsed_time": "0:47:18", "remaining_time": "17:21:04", "throughput": 3348.55, "total_tokens": 9503872} +{"current_steps": 7810, "total_steps": 179580, "loss": 0.1946, "lr": 2.1742398930838626e-05, "epoch": 0.8698073282102684, "percentage": 4.35, "elapsed_time": "0:47:19", "remaining_time": "17:20:59", "throughput": 3348.56, "total_tokens": 9509568} +{"current_steps": 7815, "total_steps": 179580, "loss": 0.1147, "lr": 2.175632030292906e-05, "epoch": 0.8703641830938857, "percentage": 4.35, "elapsed_time": "0:47:21", "remaining_time": "17:20:57", "throughput": 3348.55, "total_tokens": 9515584} +{"current_steps": 7820, "total_steps": 179580, "loss": 0.1651, "lr": 2.177024167501949e-05, "epoch": 0.8709210379775031, "percentage": 4.35, "elapsed_time": "0:47:23", "remaining_time": "17:20:53", "throughput": 3348.5, "total_tokens": 9521248} +{"current_steps": 7825, "total_steps": 179580, "loss": 0.1401, "lr": 2.1784163047109922e-05, "epoch": 0.8714778928611204, "percentage": 4.36, "elapsed_time": "0:47:25", "remaining_time": "17:20:54", "throughput": 3348.5, "total_tokens": 9527680} +{"current_steps": 7830, "total_steps": 179580, "loss": 0.1687, "lr": 2.1798084419200356e-05, "epoch": 0.8720347477447378, "percentage": 4.36, "elapsed_time": "0:47:27", "remaining_time": "17:20:51", "throughput": 3348.48, "total_tokens": 9533632} +{"current_steps": 7835, "total_steps": 179580, "loss": 0.1458, "lr": 2.181200579129079e-05, "epoch": 0.872591602628355, "percentage": 4.36, "elapsed_time": "0:47:29", "remaining_time": "17:20:51", "throughput": 3348.5, "total_tokens": 9539968} +{"current_steps": 7840, "total_steps": 179580, "loss": 0.2578, "lr": 2.1825927163381225e-05, "epoch": 0.8731484575119723, "percentage": 4.37, "elapsed_time": "0:47:30", "remaining_time": "17:20:49", "throughput": 3348.47, "total_tokens": 9545984} +{"current_steps": 7845, "total_steps": 179580, "loss": 0.2032, "lr": 2.1839848535471656e-05, "epoch": 0.8737053123955897, "percentage": 4.37, "elapsed_time": "0:47:32", "remaining_time": "17:20:48", "throughput": 3348.48, "total_tokens": 9552256} +{"current_steps": 7850, "total_steps": 179580, "loss": 0.2748, "lr": 2.185376990756209e-05, "epoch": 0.874262167279207, "percentage": 4.37, "elapsed_time": "0:47:34", "remaining_time": "17:20:47", "throughput": 3348.49, "total_tokens": 9558464} +{"current_steps": 7855, "total_steps": 179580, "loss": 0.2523, "lr": 2.1867691279652525e-05, "epoch": 0.8748190221628244, "percentage": 4.37, "elapsed_time": "0:47:36", "remaining_time": "17:20:45", "throughput": 3348.49, "total_tokens": 9564480} +{"current_steps": 7860, "total_steps": 179580, "loss": 0.1652, "lr": 2.188161265174296e-05, "epoch": 0.8753758770464417, "percentage": 4.38, "elapsed_time": "0:47:38", "remaining_time": "17:20:43", "throughput": 3348.5, "total_tokens": 9570656} +{"current_steps": 7865, "total_steps": 179580, "loss": 0.2187, "lr": 2.189553402383339e-05, "epoch": 0.875932731930059, "percentage": 4.38, "elapsed_time": "0:47:39", "remaining_time": "17:20:41", "throughput": 3348.48, "total_tokens": 9576544} +{"current_steps": 7870, "total_steps": 179580, "loss": 0.1388, "lr": 2.190945539592382e-05, "epoch": 0.8764895868136764, "percentage": 4.38, "elapsed_time": "0:47:41", "remaining_time": "17:20:40", "throughput": 3348.48, "total_tokens": 9582784} +{"current_steps": 7875, "total_steps": 179580, "loss": 0.192, "lr": 2.1923376768014255e-05, "epoch": 0.8770464416972937, "percentage": 4.39, "elapsed_time": "0:47:43", "remaining_time": "17:20:41", "throughput": 3348.52, "total_tokens": 9589440} +{"current_steps": 7880, "total_steps": 179580, "loss": 0.2669, "lr": 2.193729814010469e-05, "epoch": 0.877603296580911, "percentage": 4.39, "elapsed_time": "0:47:45", "remaining_time": "17:20:39", "throughput": 3348.54, "total_tokens": 9595552} +{"current_steps": 7885, "total_steps": 179580, "loss": 0.329, "lr": 2.1951219512195124e-05, "epoch": 0.8781601514645283, "percentage": 4.39, "elapsed_time": "0:47:47", "remaining_time": "17:20:38", "throughput": 3348.52, "total_tokens": 9601792} +{"current_steps": 7890, "total_steps": 179580, "loss": 0.1253, "lr": 2.1965140884285558e-05, "epoch": 0.8787170063481456, "percentage": 4.39, "elapsed_time": "0:47:49", "remaining_time": "17:20:33", "throughput": 3348.52, "total_tokens": 9607296} +{"current_steps": 7895, "total_steps": 179580, "loss": 0.1562, "lr": 2.197906225637599e-05, "epoch": 0.879273861231763, "percentage": 4.4, "elapsed_time": "0:47:50", "remaining_time": "17:20:31", "throughput": 3348.54, "total_tokens": 9613504} +{"current_steps": 7900, "total_steps": 179580, "loss": 0.1098, "lr": 2.1992983628466423e-05, "epoch": 0.8798307161153803, "percentage": 4.4, "elapsed_time": "0:47:52", "remaining_time": "17:20:31", "throughput": 3348.56, "total_tokens": 9619936} +{"current_steps": 7905, "total_steps": 179580, "loss": 0.1721, "lr": 2.2006905000556858e-05, "epoch": 0.8803875709989977, "percentage": 4.4, "elapsed_time": "0:47:54", "remaining_time": "17:20:30", "throughput": 3348.58, "total_tokens": 9626080} +{"current_steps": 7910, "total_steps": 179580, "loss": 0.2215, "lr": 2.202082637264729e-05, "epoch": 0.880944425882615, "percentage": 4.4, "elapsed_time": "0:47:56", "remaining_time": "17:20:29", "throughput": 3348.6, "total_tokens": 9632352} +{"current_steps": 7915, "total_steps": 179580, "loss": 0.2808, "lr": 2.2034747744737723e-05, "epoch": 0.8815012807662324, "percentage": 4.41, "elapsed_time": "0:47:58", "remaining_time": "17:20:26", "throughput": 3348.57, "total_tokens": 9638240} +{"current_steps": 7920, "total_steps": 179580, "loss": 0.2137, "lr": 2.2048669116828154e-05, "epoch": 0.8820581356498497, "percentage": 4.41, "elapsed_time": "0:48:00", "remaining_time": "17:20:26", "throughput": 3348.59, "total_tokens": 9644640} +{"current_steps": 7925, "total_steps": 179580, "loss": 0.2544, "lr": 2.2062590488918588e-05, "epoch": 0.8826149905334669, "percentage": 4.41, "elapsed_time": "0:48:02", "remaining_time": "17:20:24", "throughput": 3348.59, "total_tokens": 9650720} +{"current_steps": 7930, "total_steps": 179580, "loss": 0.0984, "lr": 2.2076511861009023e-05, "epoch": 0.8831718454170843, "percentage": 4.42, "elapsed_time": "0:48:03", "remaining_time": "17:20:21", "throughput": 3348.56, "total_tokens": 9656544} +{"current_steps": 7935, "total_steps": 179580, "loss": 0.2044, "lr": 2.2090433233099457e-05, "epoch": 0.8837287003007016, "percentage": 4.42, "elapsed_time": "0:48:05", "remaining_time": "17:20:20", "throughput": 3348.57, "total_tokens": 9662752} +{"current_steps": 7940, "total_steps": 179580, "loss": 0.2288, "lr": 2.2104354605189888e-05, "epoch": 0.884285555184319, "percentage": 4.42, "elapsed_time": "0:48:07", "remaining_time": "17:20:15", "throughput": 3348.55, "total_tokens": 9668320} +{"current_steps": 7945, "total_steps": 179580, "loss": 0.0991, "lr": 2.2118275977280322e-05, "epoch": 0.8848424100679363, "percentage": 4.42, "elapsed_time": "0:48:09", "remaining_time": "17:20:13", "throughput": 3348.57, "total_tokens": 9674432} +{"current_steps": 7950, "total_steps": 179580, "loss": 0.1489, "lr": 2.2132197349370757e-05, "epoch": 0.8853992649515536, "percentage": 4.43, "elapsed_time": "0:48:10", "remaining_time": "17:20:12", "throughput": 3348.58, "total_tokens": 9680640} +{"current_steps": 7955, "total_steps": 179580, "loss": 0.1078, "lr": 2.2146118721461187e-05, "epoch": 0.885956119835171, "percentage": 4.43, "elapsed_time": "0:48:12", "remaining_time": "17:20:11", "throughput": 3348.58, "total_tokens": 9686880} +{"current_steps": 7960, "total_steps": 179580, "loss": 0.0899, "lr": 2.2160040093551622e-05, "epoch": 0.8865129747187883, "percentage": 4.43, "elapsed_time": "0:48:14", "remaining_time": "17:20:09", "throughput": 3348.57, "total_tokens": 9692928} +{"current_steps": 7965, "total_steps": 179580, "loss": 0.0996, "lr": 2.2173961465642053e-05, "epoch": 0.8870698296024057, "percentage": 4.44, "elapsed_time": "0:48:16", "remaining_time": "17:20:07", "throughput": 3348.56, "total_tokens": 9698944} +{"current_steps": 7970, "total_steps": 179580, "loss": 0.2382, "lr": 2.2187882837732487e-05, "epoch": 0.8876266844860229, "percentage": 4.44, "elapsed_time": "0:48:18", "remaining_time": "17:20:05", "throughput": 3348.56, "total_tokens": 9705088} +{"current_steps": 7975, "total_steps": 179580, "loss": 0.1053, "lr": 2.220180420982292e-05, "epoch": 0.8881835393696402, "percentage": 4.44, "elapsed_time": "0:48:20", "remaining_time": "17:20:03", "throughput": 3348.54, "total_tokens": 9711072} +{"current_steps": 7980, "total_steps": 179580, "loss": 0.1143, "lr": 2.2215725581913356e-05, "epoch": 0.8887403942532576, "percentage": 4.44, "elapsed_time": "0:48:21", "remaining_time": "17:20:03", "throughput": 3348.56, "total_tokens": 9717408} +{"current_steps": 7985, "total_steps": 179580, "loss": 0.1792, "lr": 2.2229646954003787e-05, "epoch": 0.8892972491368749, "percentage": 4.45, "elapsed_time": "0:48:23", "remaining_time": "17:20:02", "throughput": 3348.55, "total_tokens": 9723584} +{"current_steps": 7990, "total_steps": 179580, "loss": 0.2341, "lr": 2.224356832609422e-05, "epoch": 0.8898541040204923, "percentage": 4.45, "elapsed_time": "0:48:25", "remaining_time": "17:20:00", "throughput": 3348.55, "total_tokens": 9729760} +{"current_steps": 7995, "total_steps": 179580, "loss": 0.1784, "lr": 2.2257489698184655e-05, "epoch": 0.8904109589041096, "percentage": 4.45, "elapsed_time": "0:48:27", "remaining_time": "17:19:59", "throughput": 3348.52, "total_tokens": 9735776} +{"current_steps": 8000, "total_steps": 179580, "loss": 0.0901, "lr": 2.2271411070275086e-05, "epoch": 0.8909678137877269, "percentage": 4.45, "elapsed_time": "0:48:29", "remaining_time": "17:19:57", "throughput": 3348.49, "total_tokens": 9741824} +{"current_steps": 8005, "total_steps": 179580, "loss": 0.0689, "lr": 2.228533244236552e-05, "epoch": 0.8915246686713443, "percentage": 4.46, "elapsed_time": "0:48:31", "remaining_time": "17:19:52", "throughput": 3348.46, "total_tokens": 9747392} +{"current_steps": 8010, "total_steps": 179580, "loss": 0.198, "lr": 2.229925381445595e-05, "epoch": 0.8920815235549616, "percentage": 4.46, "elapsed_time": "0:48:32", "remaining_time": "17:19:52", "throughput": 3348.47, "total_tokens": 9753696} +{"current_steps": 8015, "total_steps": 179580, "loss": 0.1949, "lr": 2.2313175186546386e-05, "epoch": 0.892638378438579, "percentage": 4.46, "elapsed_time": "0:48:34", "remaining_time": "17:19:50", "throughput": 3348.49, "total_tokens": 9759904} +{"current_steps": 8020, "total_steps": 179580, "loss": 0.156, "lr": 2.232709655863682e-05, "epoch": 0.8931952333221962, "percentage": 4.47, "elapsed_time": "0:48:36", "remaining_time": "17:19:49", "throughput": 3348.49, "total_tokens": 9765984} +{"current_steps": 8025, "total_steps": 179580, "loss": 0.2565, "lr": 2.2341017930727255e-05, "epoch": 0.8937520882058135, "percentage": 4.47, "elapsed_time": "0:48:38", "remaining_time": "17:19:48", "throughput": 3348.5, "total_tokens": 9772256} +{"current_steps": 8030, "total_steps": 179580, "loss": 0.2046, "lr": 2.235493930281769e-05, "epoch": 0.8943089430894309, "percentage": 4.47, "elapsed_time": "0:48:40", "remaining_time": "17:19:45", "throughput": 3348.47, "total_tokens": 9778144} +{"current_steps": 8035, "total_steps": 179580, "loss": 0.1476, "lr": 2.236886067490812e-05, "epoch": 0.8948657979730482, "percentage": 4.47, "elapsed_time": "0:48:42", "remaining_time": "17:19:46", "throughput": 3348.5, "total_tokens": 9784704} +{"current_steps": 8040, "total_steps": 179580, "loss": 0.1403, "lr": 2.2382782046998554e-05, "epoch": 0.8954226528566656, "percentage": 4.48, "elapsed_time": "0:48:43", "remaining_time": "17:19:44", "throughput": 3348.52, "total_tokens": 9790912} +{"current_steps": 8045, "total_steps": 179580, "loss": 0.2259, "lr": 2.2396703419088985e-05, "epoch": 0.8959795077402829, "percentage": 4.48, "elapsed_time": "0:48:45", "remaining_time": "17:19:42", "throughput": 3348.54, "total_tokens": 9796928} +{"current_steps": 8050, "total_steps": 179580, "loss": 0.3391, "lr": 2.241062479117942e-05, "epoch": 0.8965363626239002, "percentage": 4.48, "elapsed_time": "0:48:47", "remaining_time": "17:19:40", "throughput": 3348.52, "total_tokens": 9803008} +{"current_steps": 8055, "total_steps": 179580, "loss": 0.182, "lr": 2.2424546163269854e-05, "epoch": 0.8970932175075176, "percentage": 4.49, "elapsed_time": "0:48:49", "remaining_time": "17:19:40", "throughput": 3348.51, "total_tokens": 9809280} +{"current_steps": 8060, "total_steps": 179580, "loss": 0.1692, "lr": 2.2438467535360285e-05, "epoch": 0.8976500723911349, "percentage": 4.49, "elapsed_time": "0:48:51", "remaining_time": "17:19:36", "throughput": 3348.49, "total_tokens": 9815008} +{"current_steps": 8065, "total_steps": 179580, "loss": 0.1405, "lr": 2.245238890745072e-05, "epoch": 0.8982069272747522, "percentage": 4.49, "elapsed_time": "0:48:53", "remaining_time": "17:19:34", "throughput": 3348.48, "total_tokens": 9821120} +{"current_steps": 8070, "total_steps": 179580, "loss": 0.1773, "lr": 2.2466310279541153e-05, "epoch": 0.8987637821583695, "percentage": 4.49, "elapsed_time": "0:48:54", "remaining_time": "17:19:32", "throughput": 3348.5, "total_tokens": 9827232} +{"current_steps": 8075, "total_steps": 179580, "loss": 0.2858, "lr": 2.2480231651631588e-05, "epoch": 0.8993206370419868, "percentage": 4.5, "elapsed_time": "0:48:56", "remaining_time": "17:19:31", "throughput": 3348.51, "total_tokens": 9833376} +{"current_steps": 8080, "total_steps": 179580, "loss": 0.0998, "lr": 2.249415302372202e-05, "epoch": 0.8998774919256042, "percentage": 4.5, "elapsed_time": "0:48:58", "remaining_time": "17:19:32", "throughput": 3348.54, "total_tokens": 9839936} +{"current_steps": 8085, "total_steps": 179580, "loss": 0.2102, "lr": 2.2508074395812453e-05, "epoch": 0.9004343468092215, "percentage": 4.5, "elapsed_time": "0:49:00", "remaining_time": "17:19:32", "throughput": 3348.57, "total_tokens": 9846496} +{"current_steps": 8090, "total_steps": 179580, "loss": 0.1513, "lr": 2.2521995767902884e-05, "epoch": 0.9009912016928389, "percentage": 4.5, "elapsed_time": "0:49:02", "remaining_time": "17:19:31", "throughput": 3348.56, "total_tokens": 9852736} +{"current_steps": 8095, "total_steps": 179580, "loss": 0.1608, "lr": 2.2535917139993318e-05, "epoch": 0.9015480565764562, "percentage": 4.51, "elapsed_time": "0:49:04", "remaining_time": "17:19:33", "throughput": 3348.59, "total_tokens": 9859456} +{"current_steps": 8100, "total_steps": 179580, "loss": 0.212, "lr": 2.2549838512083753e-05, "epoch": 0.9021049114600735, "percentage": 4.51, "elapsed_time": "0:49:06", "remaining_time": "17:19:29", "throughput": 3348.57, "total_tokens": 9865152} +{"current_steps": 8105, "total_steps": 179580, "loss": 0.0806, "lr": 2.2563759884174183e-05, "epoch": 0.9026617663436909, "percentage": 4.51, "elapsed_time": "0:49:07", "remaining_time": "17:19:27", "throughput": 3348.57, "total_tokens": 9871200} +{"current_steps": 8110, "total_steps": 179580, "loss": 0.119, "lr": 2.2577681256264618e-05, "epoch": 0.9032186212273081, "percentage": 4.52, "elapsed_time": "0:49:09", "remaining_time": "17:19:27", "throughput": 3348.6, "total_tokens": 9877664} +{"current_steps": 8115, "total_steps": 179580, "loss": 0.1636, "lr": 2.2591602628355052e-05, "epoch": 0.9037754761109255, "percentage": 4.52, "elapsed_time": "0:49:11", "remaining_time": "17:19:26", "throughput": 3348.63, "total_tokens": 9883936} +{"current_steps": 8120, "total_steps": 179580, "loss": 0.1461, "lr": 2.2605524000445486e-05, "epoch": 0.9043323309945428, "percentage": 4.52, "elapsed_time": "0:49:13", "remaining_time": "17:19:24", "throughput": 3348.64, "total_tokens": 9890144} +{"current_steps": 8125, "total_steps": 179580, "loss": 0.1114, "lr": 2.2619445372535917e-05, "epoch": 0.9048891858781601, "percentage": 4.52, "elapsed_time": "0:49:15", "remaining_time": "17:19:21", "throughput": 3348.65, "total_tokens": 9895968} +{"current_steps": 8130, "total_steps": 179580, "loss": 0.2894, "lr": 2.2633366744626352e-05, "epoch": 0.9054460407617775, "percentage": 4.53, "elapsed_time": "0:49:17", "remaining_time": "17:19:19", "throughput": 3348.64, "total_tokens": 9901984} +{"current_steps": 8135, "total_steps": 179580, "loss": 0.1387, "lr": 2.2647288116716786e-05, "epoch": 0.9060028956453948, "percentage": 4.53, "elapsed_time": "0:49:18", "remaining_time": "17:19:17", "throughput": 3348.67, "total_tokens": 9908128} +{"current_steps": 8140, "total_steps": 179580, "loss": 0.1479, "lr": 2.2661209488807217e-05, "epoch": 0.9065597505290122, "percentage": 4.53, "elapsed_time": "0:49:20", "remaining_time": "17:19:15", "throughput": 3348.66, "total_tokens": 9914208} +{"current_steps": 8145, "total_steps": 179580, "loss": 0.2305, "lr": 2.267513086089765e-05, "epoch": 0.9071166054126295, "percentage": 4.54, "elapsed_time": "0:49:22", "remaining_time": "17:19:14", "throughput": 3348.65, "total_tokens": 9920480} +{"current_steps": 8150, "total_steps": 179580, "loss": 0.246, "lr": 2.2689052232988082e-05, "epoch": 0.9076734602962468, "percentage": 4.54, "elapsed_time": "0:49:24", "remaining_time": "17:19:14", "throughput": 3348.67, "total_tokens": 9926816} +{"current_steps": 8155, "total_steps": 179580, "loss": 0.2182, "lr": 2.2702973605078517e-05, "epoch": 0.9082303151798641, "percentage": 4.54, "elapsed_time": "0:49:26", "remaining_time": "17:19:13", "throughput": 3348.69, "total_tokens": 9933120} +{"current_steps": 8160, "total_steps": 179580, "loss": 0.1144, "lr": 2.271689497716895e-05, "epoch": 0.9087871700634814, "percentage": 4.54, "elapsed_time": "0:49:28", "remaining_time": "17:19:11", "throughput": 3348.66, "total_tokens": 9939072} +{"current_steps": 8165, "total_steps": 179580, "loss": 0.2408, "lr": 2.2730816349259385e-05, "epoch": 0.9093440249470988, "percentage": 4.55, "elapsed_time": "0:49:29", "remaining_time": "17:19:09", "throughput": 3348.64, "total_tokens": 9945024} +{"current_steps": 8170, "total_steps": 179580, "loss": 0.1364, "lr": 2.274473772134982e-05, "epoch": 0.9099008798307161, "percentage": 4.55, "elapsed_time": "0:49:31", "remaining_time": "17:19:07", "throughput": 3348.63, "total_tokens": 9951104} +{"current_steps": 8175, "total_steps": 179580, "loss": 0.2056, "lr": 2.275865909344025e-05, "epoch": 0.9104577347143334, "percentage": 4.55, "elapsed_time": "0:49:33", "remaining_time": "17:19:05", "throughput": 3348.61, "total_tokens": 9957088} +{"current_steps": 8180, "total_steps": 179580, "loss": 0.1714, "lr": 2.2772580465530685e-05, "epoch": 0.9110145895979508, "percentage": 4.56, "elapsed_time": "0:49:35", "remaining_time": "17:19:03", "throughput": 3348.59, "total_tokens": 9963072} +{"current_steps": 8185, "total_steps": 179580, "loss": 0.3199, "lr": 2.2786501837621116e-05, "epoch": 0.9115714444815681, "percentage": 4.56, "elapsed_time": "0:49:37", "remaining_time": "17:19:02", "throughput": 3348.59, "total_tokens": 9969280} +{"current_steps": 8190, "total_steps": 179580, "loss": 0.2734, "lr": 2.280042320971155e-05, "epoch": 0.9121282993651855, "percentage": 4.56, "elapsed_time": "0:49:38", "remaining_time": "17:18:59", "throughput": 3348.58, "total_tokens": 9975296} +{"current_steps": 8195, "total_steps": 179580, "loss": 0.2752, "lr": 2.2814344581801984e-05, "epoch": 0.9126851542488028, "percentage": 4.56, "elapsed_time": "0:49:40", "remaining_time": "17:18:57", "throughput": 3348.59, "total_tokens": 9981376} +{"current_steps": 8200, "total_steps": 179580, "loss": 0.1705, "lr": 2.2828265953892415e-05, "epoch": 0.91324200913242, "percentage": 4.57, "elapsed_time": "0:49:42", "remaining_time": "17:18:55", "throughput": 3348.58, "total_tokens": 9987392} +{"current_steps": 8205, "total_steps": 179580, "loss": 0.214, "lr": 2.284218732598285e-05, "epoch": 0.9137988640160374, "percentage": 4.57, "elapsed_time": "0:49:44", "remaining_time": "17:18:53", "throughput": 3348.56, "total_tokens": 9993344} +{"current_steps": 8210, "total_steps": 179580, "loss": 0.1333, "lr": 2.2856108698073284e-05, "epoch": 0.9143557188996547, "percentage": 4.57, "elapsed_time": "0:49:46", "remaining_time": "17:18:52", "throughput": 3348.56, "total_tokens": 9999520} +{"current_steps": 8215, "total_steps": 179580, "loss": 0.058, "lr": 2.287003007016372e-05, "epoch": 0.9149125737832721, "percentage": 4.57, "elapsed_time": "0:49:47", "remaining_time": "17:18:49", "throughput": 3348.55, "total_tokens": 10005376} +{"current_steps": 8220, "total_steps": 179580, "loss": 0.0832, "lr": 2.288395144225415e-05, "epoch": 0.9154694286668894, "percentage": 4.58, "elapsed_time": "0:49:49", "remaining_time": "17:18:47", "throughput": 3348.55, "total_tokens": 10011424} +{"current_steps": 8225, "total_steps": 179580, "loss": 0.124, "lr": 2.2897872814344584e-05, "epoch": 0.9160262835505067, "percentage": 4.58, "elapsed_time": "0:49:51", "remaining_time": "17:18:45", "throughput": 3348.58, "total_tokens": 10017600} +{"current_steps": 8230, "total_steps": 179580, "loss": 0.2088, "lr": 2.2911794186435015e-05, "epoch": 0.9165831384341241, "percentage": 4.58, "elapsed_time": "0:49:53", "remaining_time": "17:18:41", "throughput": 3348.56, "total_tokens": 10023264} +{"current_steps": 8235, "total_steps": 179580, "loss": 0.1766, "lr": 2.292571555852545e-05, "epoch": 0.9171399933177414, "percentage": 4.59, "elapsed_time": "0:49:55", "remaining_time": "17:18:39", "throughput": 3348.56, "total_tokens": 10029312} +{"current_steps": 8240, "total_steps": 179580, "loss": 0.0494, "lr": 2.2939636930615883e-05, "epoch": 0.9176968482013588, "percentage": 4.59, "elapsed_time": "0:49:57", "remaining_time": "17:18:39", "throughput": 3348.58, "total_tokens": 10035776} +{"current_steps": 8245, "total_steps": 179580, "loss": 0.1329, "lr": 2.2953558302706314e-05, "epoch": 0.918253703084976, "percentage": 4.59, "elapsed_time": "0:49:58", "remaining_time": "17:18:36", "throughput": 3348.55, "total_tokens": 10041632} +{"current_steps": 8250, "total_steps": 179580, "loss": 0.1464, "lr": 2.296747967479675e-05, "epoch": 0.9188105579685933, "percentage": 4.59, "elapsed_time": "0:50:00", "remaining_time": "17:18:33", "throughput": 3348.55, "total_tokens": 10047584} +{"current_steps": 8255, "total_steps": 179580, "loss": 0.0983, "lr": 2.2981401046887183e-05, "epoch": 0.9193674128522107, "percentage": 4.6, "elapsed_time": "0:50:02", "remaining_time": "17:18:32", "throughput": 3348.56, "total_tokens": 10053760} +{"current_steps": 8260, "total_steps": 179580, "loss": 0.1087, "lr": 2.2995322418977617e-05, "epoch": 0.919924267735828, "percentage": 4.6, "elapsed_time": "0:50:04", "remaining_time": "17:18:29", "throughput": 3348.54, "total_tokens": 10059680} +{"current_steps": 8265, "total_steps": 179580, "loss": 0.2489, "lr": 2.3009243791068048e-05, "epoch": 0.9204811226194454, "percentage": 4.6, "elapsed_time": "0:50:06", "remaining_time": "17:18:28", "throughput": 3348.5, "total_tokens": 10065760} +{"current_steps": 8270, "total_steps": 179580, "loss": 0.2122, "lr": 2.3023165163158482e-05, "epoch": 0.9210379775030627, "percentage": 4.61, "elapsed_time": "0:50:07", "remaining_time": "17:18:25", "throughput": 3348.49, "total_tokens": 10071584} +{"current_steps": 8275, "total_steps": 179580, "loss": 0.0768, "lr": 2.3037086535248913e-05, "epoch": 0.92159483238668, "percentage": 4.61, "elapsed_time": "0:50:09", "remaining_time": "17:18:23", "throughput": 3348.48, "total_tokens": 10077664} +{"current_steps": 8280, "total_steps": 179580, "loss": 0.2047, "lr": 2.3051007907339348e-05, "epoch": 0.9221516872702974, "percentage": 4.61, "elapsed_time": "0:50:11", "remaining_time": "17:18:24", "throughput": 3348.48, "total_tokens": 10084192} +{"current_steps": 8285, "total_steps": 179580, "loss": 0.1375, "lr": 2.3064929279429782e-05, "epoch": 0.9227085421539147, "percentage": 4.61, "elapsed_time": "0:50:13", "remaining_time": "17:18:23", "throughput": 3348.46, "total_tokens": 10090336} +{"current_steps": 8290, "total_steps": 179580, "loss": 0.2865, "lr": 2.3078850651520213e-05, "epoch": 0.923265397037532, "percentage": 4.62, "elapsed_time": "0:50:15", "remaining_time": "17:18:22", "throughput": 3348.49, "total_tokens": 10096640} +{"current_steps": 8295, "total_steps": 179580, "loss": 0.1754, "lr": 2.3092772023610647e-05, "epoch": 0.9238222519211493, "percentage": 4.62, "elapsed_time": "0:50:17", "remaining_time": "17:18:18", "throughput": 3348.52, "total_tokens": 10102528} +{"current_steps": 8300, "total_steps": 179580, "loss": 0.168, "lr": 2.310669339570108e-05, "epoch": 0.9243791068047666, "percentage": 4.62, "elapsed_time": "0:50:18", "remaining_time": "17:18:16", "throughput": 3348.49, "total_tokens": 10108416} +{"current_steps": 8305, "total_steps": 179580, "loss": 0.0849, "lr": 2.3120614767791516e-05, "epoch": 0.924935961688384, "percentage": 4.62, "elapsed_time": "0:50:20", "remaining_time": "17:18:14", "throughput": 3348.54, "total_tokens": 10114624} +{"current_steps": 8310, "total_steps": 179580, "loss": 0.1013, "lr": 2.313453613988195e-05, "epoch": 0.9254928165720013, "percentage": 4.63, "elapsed_time": "0:50:22", "remaining_time": "17:18:12", "throughput": 3348.51, "total_tokens": 10120640} +{"current_steps": 8315, "total_steps": 179580, "loss": 0.0621, "lr": 2.314845751197238e-05, "epoch": 0.9260496714556187, "percentage": 4.63, "elapsed_time": "0:50:24", "remaining_time": "17:18:11", "throughput": 3348.53, "total_tokens": 10126976} +{"current_steps": 8320, "total_steps": 179580, "loss": 0.1465, "lr": 2.3162378884062812e-05, "epoch": 0.926606526339236, "percentage": 4.63, "elapsed_time": "0:50:26", "remaining_time": "17:18:11", "throughput": 3348.53, "total_tokens": 10133248} +{"current_steps": 8325, "total_steps": 179580, "loss": 0.1929, "lr": 2.3176300256153246e-05, "epoch": 0.9271633812228534, "percentage": 4.64, "elapsed_time": "0:50:28", "remaining_time": "17:18:10", "throughput": 3348.53, "total_tokens": 10139584} +{"current_steps": 8330, "total_steps": 179580, "loss": 0.0477, "lr": 2.319022162824368e-05, "epoch": 0.9277202361064707, "percentage": 4.64, "elapsed_time": "0:50:29", "remaining_time": "17:18:07", "throughput": 3348.54, "total_tokens": 10145376} +{"current_steps": 8335, "total_steps": 179580, "loss": 0.1576, "lr": 2.3204143000334115e-05, "epoch": 0.928277090990088, "percentage": 4.64, "elapsed_time": "0:50:31", "remaining_time": "17:18:06", "throughput": 3348.54, "total_tokens": 10151744} +{"current_steps": 8340, "total_steps": 179580, "loss": 0.1795, "lr": 2.3218064372424546e-05, "epoch": 0.9288339458737053, "percentage": 4.64, "elapsed_time": "0:50:33", "remaining_time": "17:18:03", "throughput": 3348.56, "total_tokens": 10157664} +{"current_steps": 8345, "total_steps": 179580, "loss": 0.1167, "lr": 2.323198574451498e-05, "epoch": 0.9293908007573226, "percentage": 4.65, "elapsed_time": "0:50:35", "remaining_time": "17:18:02", "throughput": 3348.54, "total_tokens": 10163712} +{"current_steps": 8350, "total_steps": 179580, "loss": 0.0944, "lr": 2.3245907116605415e-05, "epoch": 0.92994765564094, "percentage": 4.65, "elapsed_time": "0:50:37", "remaining_time": "17:17:59", "throughput": 3348.56, "total_tokens": 10169728} +{"current_steps": 8355, "total_steps": 179580, "loss": 0.3045, "lr": 2.325982848869585e-05, "epoch": 0.9305045105245573, "percentage": 4.65, "elapsed_time": "0:50:38", "remaining_time": "17:17:56", "throughput": 3348.56, "total_tokens": 10175680} +{"current_steps": 8360, "total_steps": 179580, "loss": 0.1002, "lr": 2.327374986078628e-05, "epoch": 0.9310613654081746, "percentage": 4.66, "elapsed_time": "0:50:40", "remaining_time": "17:17:54", "throughput": 3348.56, "total_tokens": 10181728} +{"current_steps": 8365, "total_steps": 179580, "loss": 0.1505, "lr": 2.328767123287671e-05, "epoch": 0.931618220291792, "percentage": 4.66, "elapsed_time": "0:50:42", "remaining_time": "17:17:52", "throughput": 3348.57, "total_tokens": 10187808} +{"current_steps": 8370, "total_steps": 179580, "loss": 0.2292, "lr": 2.3301592604967145e-05, "epoch": 0.9321750751754093, "percentage": 4.66, "elapsed_time": "0:50:44", "remaining_time": "17:17:51", "throughput": 3348.54, "total_tokens": 10193856} +{"current_steps": 8375, "total_steps": 179580, "loss": 0.2063, "lr": 2.331551397705758e-05, "epoch": 0.9327319300590267, "percentage": 4.66, "elapsed_time": "0:50:46", "remaining_time": "17:17:49", "throughput": 3348.53, "total_tokens": 10199968} +{"current_steps": 8380, "total_steps": 179580, "loss": 0.1524, "lr": 2.3329435349148014e-05, "epoch": 0.933288784942644, "percentage": 4.67, "elapsed_time": "0:50:47", "remaining_time": "17:17:46", "throughput": 3348.48, "total_tokens": 10205600} +{"current_steps": 8385, "total_steps": 179580, "loss": 0.1909, "lr": 2.3343356721238445e-05, "epoch": 0.9338456398262612, "percentage": 4.67, "elapsed_time": "0:50:49", "remaining_time": "17:17:44", "throughput": 3348.48, "total_tokens": 10211680} +{"current_steps": 8390, "total_steps": 179580, "loss": 0.2277, "lr": 2.335727809332888e-05, "epoch": 0.9344024947098786, "percentage": 4.67, "elapsed_time": "0:50:51", "remaining_time": "17:17:43", "throughput": 3348.49, "total_tokens": 10218048} +{"current_steps": 8395, "total_steps": 179580, "loss": 0.1153, "lr": 2.3371199465419314e-05, "epoch": 0.9349593495934959, "percentage": 4.67, "elapsed_time": "0:50:53", "remaining_time": "17:17:42", "throughput": 3348.49, "total_tokens": 10224160} +{"current_steps": 8400, "total_steps": 179580, "loss": 0.0776, "lr": 2.3385120837509748e-05, "epoch": 0.9355162044771133, "percentage": 4.68, "elapsed_time": "0:50:55", "remaining_time": "17:17:39", "throughput": 3348.48, "total_tokens": 10230016} +{"current_steps": 8405, "total_steps": 179580, "loss": 0.0795, "lr": 2.339904220960018e-05, "epoch": 0.9360730593607306, "percentage": 4.68, "elapsed_time": "0:50:56", "remaining_time": "17:17:37", "throughput": 3348.48, "total_tokens": 10236128} +{"current_steps": 8410, "total_steps": 179580, "loss": 0.1114, "lr": 2.341296358169061e-05, "epoch": 0.9366299142443479, "percentage": 4.68, "elapsed_time": "0:50:58", "remaining_time": "17:17:36", "throughput": 3348.48, "total_tokens": 10242304} +{"current_steps": 8415, "total_steps": 179580, "loss": 0.2902, "lr": 2.3426884953781044e-05, "epoch": 0.9371867691279653, "percentage": 4.69, "elapsed_time": "0:51:00", "remaining_time": "17:17:32", "throughput": 3348.49, "total_tokens": 10248096} +{"current_steps": 8420, "total_steps": 179580, "loss": 0.2129, "lr": 2.344080632587148e-05, "epoch": 0.9377436240115826, "percentage": 4.69, "elapsed_time": "0:51:02", "remaining_time": "17:17:28", "throughput": 3348.45, "total_tokens": 10253792} +{"current_steps": 8425, "total_steps": 179580, "loss": 0.1146, "lr": 2.3454727697961913e-05, "epoch": 0.9383004788952, "percentage": 4.69, "elapsed_time": "0:51:04", "remaining_time": "17:17:27", "throughput": 3348.45, "total_tokens": 10259936} +{"current_steps": 8430, "total_steps": 179580, "loss": 0.3063, "lr": 2.3468649070052347e-05, "epoch": 0.9388573337788172, "percentage": 4.69, "elapsed_time": "0:51:05", "remaining_time": "17:17:22", "throughput": 3348.41, "total_tokens": 10265408} +{"current_steps": 8435, "total_steps": 179580, "loss": 0.117, "lr": 2.3482570442142778e-05, "epoch": 0.9394141886624345, "percentage": 4.7, "elapsed_time": "0:51:07", "remaining_time": "17:17:22", "throughput": 3348.42, "total_tokens": 10271840} +{"current_steps": 8440, "total_steps": 179580, "loss": 0.3051, "lr": 2.3496491814233212e-05, "epoch": 0.9399710435460519, "percentage": 4.7, "elapsed_time": "0:51:09", "remaining_time": "17:17:19", "throughput": 3348.42, "total_tokens": 10277664} +{"current_steps": 8445, "total_steps": 179580, "loss": 0.1729, "lr": 2.3510413186323647e-05, "epoch": 0.9405278984296692, "percentage": 4.7, "elapsed_time": "0:51:11", "remaining_time": "17:17:19", "throughput": 3348.41, "total_tokens": 10284000} +{"current_steps": 8450, "total_steps": 179580, "loss": 0.1878, "lr": 2.352433455841408e-05, "epoch": 0.9410847533132866, "percentage": 4.71, "elapsed_time": "0:51:13", "remaining_time": "17:17:17", "throughput": 3348.42, "total_tokens": 10290208} +{"current_steps": 8455, "total_steps": 179580, "loss": 0.1655, "lr": 2.3538255930504512e-05, "epoch": 0.9416416081969039, "percentage": 4.71, "elapsed_time": "0:51:14", "remaining_time": "17:17:16", "throughput": 3348.42, "total_tokens": 10296320} +{"current_steps": 8460, "total_steps": 179580, "loss": 0.1338, "lr": 2.3552177302594943e-05, "epoch": 0.9421984630805212, "percentage": 4.71, "elapsed_time": "0:51:16", "remaining_time": "17:17:15", "throughput": 3348.44, "total_tokens": 10302688} +{"current_steps": 8465, "total_steps": 179580, "loss": 0.144, "lr": 2.3566098674685377e-05, "epoch": 0.9427553179641386, "percentage": 4.71, "elapsed_time": "0:51:18", "remaining_time": "17:17:14", "throughput": 3348.46, "total_tokens": 10308928} +{"current_steps": 8470, "total_steps": 179580, "loss": 0.1239, "lr": 2.358002004677581e-05, "epoch": 0.9433121728477559, "percentage": 4.72, "elapsed_time": "0:51:20", "remaining_time": "17:17:12", "throughput": 3348.47, "total_tokens": 10315008} +{"current_steps": 8475, "total_steps": 179580, "loss": 0.2772, "lr": 2.3593941418866246e-05, "epoch": 0.9438690277313732, "percentage": 4.72, "elapsed_time": "0:51:22", "remaining_time": "17:17:07", "throughput": 3348.41, "total_tokens": 10320384} +{"current_steps": 8480, "total_steps": 179580, "loss": 0.2217, "lr": 2.3607862790956677e-05, "epoch": 0.9444258826149905, "percentage": 4.72, "elapsed_time": "0:51:23", "remaining_time": "17:17:05", "throughput": 3348.41, "total_tokens": 10326464} +{"current_steps": 8485, "total_steps": 179580, "loss": 0.0868, "lr": 2.362178416304711e-05, "epoch": 0.9449827374986078, "percentage": 4.72, "elapsed_time": "0:51:25", "remaining_time": "17:17:03", "throughput": 3348.42, "total_tokens": 10332640} +{"current_steps": 8490, "total_steps": 179580, "loss": 0.1422, "lr": 2.3635705535137545e-05, "epoch": 0.9455395923822252, "percentage": 4.73, "elapsed_time": "0:51:27", "remaining_time": "17:17:01", "throughput": 3348.4, "total_tokens": 10338560} +{"current_steps": 8495, "total_steps": 179580, "loss": 0.0788, "lr": 2.364962690722798e-05, "epoch": 0.9460964472658425, "percentage": 4.73, "elapsed_time": "0:51:29", "remaining_time": "17:17:01", "throughput": 3348.44, "total_tokens": 10345088} +{"current_steps": 8500, "total_steps": 179580, "loss": 0.0743, "lr": 2.366354827931841e-05, "epoch": 0.9466533021494599, "percentage": 4.73, "elapsed_time": "0:51:31", "remaining_time": "17:17:00", "throughput": 3348.42, "total_tokens": 10351296} +{"current_steps": 8505, "total_steps": 179580, "loss": 0.5171, "lr": 2.367746965140884e-05, "epoch": 0.9472101570330772, "percentage": 4.74, "elapsed_time": "0:51:33", "remaining_time": "17:16:58", "throughput": 3348.4, "total_tokens": 10357248} +{"current_steps": 8510, "total_steps": 179580, "loss": 0.0495, "lr": 2.3691391023499276e-05, "epoch": 0.9477670119166945, "percentage": 4.74, "elapsed_time": "0:51:35", "remaining_time": "17:16:57", "throughput": 3348.39, "total_tokens": 10363488} +{"current_steps": 8515, "total_steps": 179580, "loss": 0.1179, "lr": 2.370531239558971e-05, "epoch": 0.9483238668003119, "percentage": 4.74, "elapsed_time": "0:51:36", "remaining_time": "17:16:55", "throughput": 3348.38, "total_tokens": 10369440} +{"current_steps": 8520, "total_steps": 179580, "loss": 0.1628, "lr": 2.3719233767680145e-05, "epoch": 0.9488807216839291, "percentage": 4.74, "elapsed_time": "0:51:38", "remaining_time": "17:16:53", "throughput": 3348.39, "total_tokens": 10375648} +{"current_steps": 8525, "total_steps": 179580, "loss": 0.1765, "lr": 2.3733155139770576e-05, "epoch": 0.9494375765675465, "percentage": 4.75, "elapsed_time": "0:51:40", "remaining_time": "17:16:54", "throughput": 3348.39, "total_tokens": 10382144} +{"current_steps": 8530, "total_steps": 179580, "loss": 0.1486, "lr": 2.374707651186101e-05, "epoch": 0.9499944314511638, "percentage": 4.75, "elapsed_time": "0:51:42", "remaining_time": "17:16:53", "throughput": 3348.41, "total_tokens": 10388480} +{"current_steps": 8535, "total_steps": 179580, "loss": 0.0948, "lr": 2.3760997883951444e-05, "epoch": 0.9505512863347811, "percentage": 4.75, "elapsed_time": "0:51:44", "remaining_time": "17:16:52", "throughput": 3348.41, "total_tokens": 10394624} +{"current_steps": 8540, "total_steps": 179580, "loss": 0.1501, "lr": 2.377491925604188e-05, "epoch": 0.9511081412183985, "percentage": 4.76, "elapsed_time": "0:51:46", "remaining_time": "17:16:53", "throughput": 3348.42, "total_tokens": 10401152} +{"current_steps": 8545, "total_steps": 179580, "loss": 0.2319, "lr": 2.378884062813231e-05, "epoch": 0.9516649961020158, "percentage": 4.76, "elapsed_time": "0:51:48", "remaining_time": "17:16:52", "throughput": 3348.36, "total_tokens": 10407200} +{"current_steps": 8550, "total_steps": 179580, "loss": 0.1872, "lr": 2.380276200022274e-05, "epoch": 0.9522218509856332, "percentage": 4.76, "elapsed_time": "0:51:49", "remaining_time": "17:16:50", "throughput": 3348.23, "total_tokens": 10412960} +{"current_steps": 8555, "total_steps": 179580, "loss": 0.1685, "lr": 2.3816683372313175e-05, "epoch": 0.9527787058692505, "percentage": 4.76, "elapsed_time": "0:51:51", "remaining_time": "17:16:50", "throughput": 3348.27, "total_tokens": 10419424} +{"current_steps": 8560, "total_steps": 179580, "loss": 0.2944, "lr": 2.383060474440361e-05, "epoch": 0.9533355607528678, "percentage": 4.77, "elapsed_time": "0:51:53", "remaining_time": "17:16:50", "throughput": 3348.3, "total_tokens": 10425888} +{"current_steps": 8565, "total_steps": 179580, "loss": 0.2067, "lr": 2.3844526116494043e-05, "epoch": 0.9538924156364851, "percentage": 4.77, "elapsed_time": "0:51:55", "remaining_time": "17:16:49", "throughput": 3348.32, "total_tokens": 10432224} +{"current_steps": 8570, "total_steps": 179580, "loss": 0.1899, "lr": 2.3858447488584478e-05, "epoch": 0.9544492705201024, "percentage": 4.77, "elapsed_time": "0:51:57", "remaining_time": "17:16:47", "throughput": 3348.31, "total_tokens": 10438208} +{"current_steps": 8575, "total_steps": 179580, "loss": 0.0898, "lr": 2.387236886067491e-05, "epoch": 0.9550061254037198, "percentage": 4.78, "elapsed_time": "0:51:59", "remaining_time": "17:16:45", "throughput": 3348.31, "total_tokens": 10444352} +{"current_steps": 8580, "total_steps": 179580, "loss": 0.1421, "lr": 2.3886290232765343e-05, "epoch": 0.9555629802873371, "percentage": 4.78, "elapsed_time": "0:52:01", "remaining_time": "17:16:43", "throughput": 3348.34, "total_tokens": 10450528} +{"current_steps": 8585, "total_steps": 179580, "loss": 0.1847, "lr": 2.3900211604855777e-05, "epoch": 0.9561198351709544, "percentage": 4.78, "elapsed_time": "0:52:02", "remaining_time": "17:16:43", "throughput": 3348.36, "total_tokens": 10456864} +{"current_steps": 8590, "total_steps": 179580, "loss": 0.2051, "lr": 2.391413297694621e-05, "epoch": 0.9566766900545718, "percentage": 4.78, "elapsed_time": "0:52:04", "remaining_time": "17:16:41", "throughput": 3348.33, "total_tokens": 10462880} +{"current_steps": 8595, "total_steps": 179580, "loss": 0.1508, "lr": 2.3928054349036643e-05, "epoch": 0.9572335449381891, "percentage": 4.79, "elapsed_time": "0:52:06", "remaining_time": "17:16:37", "throughput": 3348.33, "total_tokens": 10468672} +{"current_steps": 8600, "total_steps": 179580, "loss": 0.1962, "lr": 2.3941975721127074e-05, "epoch": 0.9577903998218065, "percentage": 4.79, "elapsed_time": "0:52:08", "remaining_time": "17:16:35", "throughput": 3348.35, "total_tokens": 10474784} +{"current_steps": 8605, "total_steps": 179580, "loss": 0.0402, "lr": 2.3955897093217508e-05, "epoch": 0.9583472547054238, "percentage": 4.79, "elapsed_time": "0:52:10", "remaining_time": "17:16:34", "throughput": 3348.36, "total_tokens": 10480960} +{"current_steps": 8610, "total_steps": 179580, "loss": 0.1439, "lr": 2.3969818465307942e-05, "epoch": 0.958904109589041, "percentage": 4.79, "elapsed_time": "0:52:12", "remaining_time": "17:16:34", "throughput": 3348.37, "total_tokens": 10487360} +{"current_steps": 8615, "total_steps": 179580, "loss": 0.0839, "lr": 2.3983739837398377e-05, "epoch": 0.9594609644726584, "percentage": 4.8, "elapsed_time": "0:52:13", "remaining_time": "17:16:32", "throughput": 3348.36, "total_tokens": 10493472} +{"current_steps": 8620, "total_steps": 179580, "loss": 0.196, "lr": 2.3997661209488807e-05, "epoch": 0.9600178193562757, "percentage": 4.8, "elapsed_time": "0:52:15", "remaining_time": "17:16:29", "throughput": 3348.39, "total_tokens": 10499424} +{"current_steps": 8625, "total_steps": 179580, "loss": 0.1261, "lr": 2.4011582581579242e-05, "epoch": 0.9605746742398931, "percentage": 4.8, "elapsed_time": "0:52:17", "remaining_time": "17:16:28", "throughput": 3348.38, "total_tokens": 10505536} +{"current_steps": 8630, "total_steps": 179580, "loss": 0.1285, "lr": 2.4025503953669676e-05, "epoch": 0.9611315291235104, "percentage": 4.81, "elapsed_time": "0:52:19", "remaining_time": "17:16:26", "throughput": 3348.36, "total_tokens": 10511616} +{"current_steps": 8635, "total_steps": 179580, "loss": 0.1094, "lr": 2.403942532576011e-05, "epoch": 0.9616883840071278, "percentage": 4.81, "elapsed_time": "0:52:21", "remaining_time": "17:16:22", "throughput": 3348.34, "total_tokens": 10517344} +{"current_steps": 8640, "total_steps": 179580, "loss": 0.2096, "lr": 2.405334669785054e-05, "epoch": 0.9622452388907451, "percentage": 4.81, "elapsed_time": "0:52:22", "remaining_time": "17:16:21", "throughput": 3348.36, "total_tokens": 10523488} +{"current_steps": 8645, "total_steps": 179580, "loss": 0.0931, "lr": 2.4067268069940972e-05, "epoch": 0.9628020937743624, "percentage": 4.81, "elapsed_time": "0:52:24", "remaining_time": "17:16:18", "throughput": 3348.37, "total_tokens": 10529568} +{"current_steps": 8650, "total_steps": 179580, "loss": 0.2176, "lr": 2.4081189442031407e-05, "epoch": 0.9633589486579798, "percentage": 4.82, "elapsed_time": "0:52:26", "remaining_time": "17:16:19", "throughput": 3348.38, "total_tokens": 10536160} +{"current_steps": 8655, "total_steps": 179580, "loss": 0.1623, "lr": 2.409511081412184e-05, "epoch": 0.963915803541597, "percentage": 4.82, "elapsed_time": "0:52:28", "remaining_time": "17:16:17", "throughput": 3348.38, "total_tokens": 10542080} +{"current_steps": 8660, "total_steps": 179580, "loss": 0.0764, "lr": 2.4109032186212275e-05, "epoch": 0.9644726584252143, "percentage": 4.82, "elapsed_time": "0:52:30", "remaining_time": "17:16:13", "throughput": 3348.36, "total_tokens": 10547776} +{"current_steps": 8665, "total_steps": 179580, "loss": 0.1692, "lr": 2.4122953558302706e-05, "epoch": 0.9650295133088317, "percentage": 4.83, "elapsed_time": "0:52:31", "remaining_time": "17:16:11", "throughput": 3348.36, "total_tokens": 10553888} +{"current_steps": 8670, "total_steps": 179580, "loss": 0.2313, "lr": 2.413687493039314e-05, "epoch": 0.965586368192449, "percentage": 4.83, "elapsed_time": "0:52:33", "remaining_time": "17:16:09", "throughput": 3348.37, "total_tokens": 10560000} +{"current_steps": 8675, "total_steps": 179580, "loss": 0.1382, "lr": 2.4150796302483575e-05, "epoch": 0.9661432230760664, "percentage": 4.83, "elapsed_time": "0:52:35", "remaining_time": "17:16:10", "throughput": 3348.4, "total_tokens": 10566560} +{"current_steps": 8680, "total_steps": 179580, "loss": 0.1173, "lr": 2.416471767457401e-05, "epoch": 0.9667000779596837, "percentage": 4.83, "elapsed_time": "0:52:37", "remaining_time": "17:16:09", "throughput": 3348.42, "total_tokens": 10572896} +{"current_steps": 8685, "total_steps": 179580, "loss": 0.2627, "lr": 2.417863904666444e-05, "epoch": 0.967256932843301, "percentage": 4.84, "elapsed_time": "0:52:39", "remaining_time": "17:16:08", "throughput": 3348.43, "total_tokens": 10579264} +{"current_steps": 8690, "total_steps": 179580, "loss": 0.1868, "lr": 2.419256041875487e-05, "epoch": 0.9678137877269184, "percentage": 4.84, "elapsed_time": "0:52:41", "remaining_time": "17:16:05", "throughput": 3348.38, "total_tokens": 10584928} +{"current_steps": 8695, "total_steps": 179580, "loss": 0.1949, "lr": 2.4206481790845305e-05, "epoch": 0.9683706426105357, "percentage": 4.84, "elapsed_time": "0:52:43", "remaining_time": "17:16:04", "throughput": 3348.39, "total_tokens": 10591104} +{"current_steps": 8700, "total_steps": 179580, "loss": 0.2754, "lr": 2.422040316293574e-05, "epoch": 0.9689274974941531, "percentage": 4.84, "elapsed_time": "0:52:44", "remaining_time": "17:16:02", "throughput": 3348.37, "total_tokens": 10597152} +{"current_steps": 8705, "total_steps": 179580, "loss": 0.1991, "lr": 2.4234324535026174e-05, "epoch": 0.9694843523777703, "percentage": 4.85, "elapsed_time": "0:52:46", "remaining_time": "17:16:01", "throughput": 3348.37, "total_tokens": 10603392} +{"current_steps": 8710, "total_steps": 179580, "loss": 0.1109, "lr": 2.424824590711661e-05, "epoch": 0.9700412072613877, "percentage": 4.85, "elapsed_time": "0:52:48", "remaining_time": "17:15:56", "throughput": 3348.33, "total_tokens": 10608800} +{"current_steps": 8715, "total_steps": 179580, "loss": 0.1243, "lr": 2.426216727920704e-05, "epoch": 0.970598062145005, "percentage": 4.85, "elapsed_time": "0:52:50", "remaining_time": "17:15:55", "throughput": 3348.33, "total_tokens": 10615072} +{"current_steps": 8720, "total_steps": 179580, "loss": 0.0888, "lr": 2.4276088651297474e-05, "epoch": 0.9711549170286223, "percentage": 4.86, "elapsed_time": "0:52:52", "remaining_time": "17:15:52", "throughput": 3348.31, "total_tokens": 10620864} +{"current_steps": 8725, "total_steps": 179580, "loss": 0.1699, "lr": 2.4290010023387908e-05, "epoch": 0.9717117719122397, "percentage": 4.86, "elapsed_time": "0:52:53", "remaining_time": "17:15:48", "throughput": 3348.24, "total_tokens": 10626336} +{"current_steps": 8730, "total_steps": 179580, "loss": 0.2186, "lr": 2.430393139547834e-05, "epoch": 0.972268626795857, "percentage": 4.86, "elapsed_time": "0:52:55", "remaining_time": "17:15:46", "throughput": 3348.23, "total_tokens": 10632448} +{"current_steps": 8735, "total_steps": 179580, "loss": 0.0874, "lr": 2.4317852767568773e-05, "epoch": 0.9728254816794744, "percentage": 4.86, "elapsed_time": "0:52:57", "remaining_time": "17:15:45", "throughput": 3348.24, "total_tokens": 10638624} +{"current_steps": 8740, "total_steps": 179580, "loss": 0.1426, "lr": 2.4331774139659204e-05, "epoch": 0.9733823365630917, "percentage": 4.87, "elapsed_time": "0:52:59", "remaining_time": "17:15:42", "throughput": 3348.24, "total_tokens": 10644608} +{"current_steps": 8745, "total_steps": 179580, "loss": 0.1238, "lr": 2.434569551174964e-05, "epoch": 0.973939191446709, "percentage": 4.87, "elapsed_time": "0:53:00", "remaining_time": "17:15:39", "throughput": 3348.21, "total_tokens": 10650368} +{"current_steps": 8750, "total_steps": 179580, "loss": 0.263, "lr": 2.4359616883840073e-05, "epoch": 0.9744960463303263, "percentage": 4.87, "elapsed_time": "0:53:02", "remaining_time": "17:15:35", "throughput": 3348.18, "total_tokens": 10656032} +{"current_steps": 8755, "total_steps": 179580, "loss": 0.1984, "lr": 2.4373538255930507e-05, "epoch": 0.9750529012139436, "percentage": 4.88, "elapsed_time": "0:53:04", "remaining_time": "17:15:33", "throughput": 3348.19, "total_tokens": 10662144} +{"current_steps": 8760, "total_steps": 179580, "loss": 0.2282, "lr": 2.4387459628020938e-05, "epoch": 0.975609756097561, "percentage": 4.88, "elapsed_time": "0:53:06", "remaining_time": "17:15:32", "throughput": 3348.21, "total_tokens": 10668352} +{"current_steps": 8765, "total_steps": 179580, "loss": 0.1833, "lr": 2.4401381000111373e-05, "epoch": 0.9761666109811783, "percentage": 4.88, "elapsed_time": "0:53:08", "remaining_time": "17:15:28", "throughput": 3348.19, "total_tokens": 10674080} +{"current_steps": 8770, "total_steps": 179580, "loss": 0.1231, "lr": 2.4415302372201807e-05, "epoch": 0.9767234658647956, "percentage": 4.88, "elapsed_time": "0:53:09", "remaining_time": "17:15:28", "throughput": 3348.19, "total_tokens": 10680320} +{"current_steps": 8775, "total_steps": 179580, "loss": 0.1322, "lr": 2.4429223744292238e-05, "epoch": 0.977280320748413, "percentage": 4.89, "elapsed_time": "0:53:11", "remaining_time": "17:15:22", "throughput": 3348.19, "total_tokens": 10685824} +{"current_steps": 8780, "total_steps": 179580, "loss": 0.1615, "lr": 2.4443145116382672e-05, "epoch": 0.9778371756320303, "percentage": 4.89, "elapsed_time": "0:53:13", "remaining_time": "17:15:19", "throughput": 3348.19, "total_tokens": 10691584} +{"current_steps": 8785, "total_steps": 179580, "loss": 0.2132, "lr": 2.4457066488473103e-05, "epoch": 0.9783940305156477, "percentage": 4.89, "elapsed_time": "0:53:14", "remaining_time": "17:15:15", "throughput": 3348.16, "total_tokens": 10697312} +{"current_steps": 8790, "total_steps": 179580, "loss": 0.1839, "lr": 2.4470987860563537e-05, "epoch": 0.978950885399265, "percentage": 4.89, "elapsed_time": "0:53:16", "remaining_time": "17:15:13", "throughput": 3348.16, "total_tokens": 10703328} +{"current_steps": 8795, "total_steps": 179580, "loss": 0.2643, "lr": 2.4484909232653972e-05, "epoch": 0.9795077402828822, "percentage": 4.9, "elapsed_time": "0:53:18", "remaining_time": "17:15:12", "throughput": 3348.18, "total_tokens": 10709664} +{"current_steps": 8800, "total_steps": 179580, "loss": 0.2051, "lr": 2.4498830604744406e-05, "epoch": 0.9800645951664996, "percentage": 4.9, "elapsed_time": "0:53:20", "remaining_time": "17:15:10", "throughput": 3348.16, "total_tokens": 10715648} +{"current_steps": 8805, "total_steps": 179580, "loss": 0.1825, "lr": 2.4512751976834837e-05, "epoch": 0.9806214500501169, "percentage": 4.9, "elapsed_time": "0:53:22", "remaining_time": "17:15:08", "throughput": 3348.15, "total_tokens": 10721632} +{"current_steps": 8810, "total_steps": 179580, "loss": 0.207, "lr": 2.452667334892527e-05, "epoch": 0.9811783049337343, "percentage": 4.91, "elapsed_time": "0:53:23", "remaining_time": "17:15:02", "throughput": 3348.13, "total_tokens": 10727008} +{"current_steps": 8815, "total_steps": 179580, "loss": 0.2259, "lr": 2.4540594721015706e-05, "epoch": 0.9817351598173516, "percentage": 4.91, "elapsed_time": "0:53:25", "remaining_time": "17:14:59", "throughput": 3348.1, "total_tokens": 10732800} +{"current_steps": 8820, "total_steps": 179580, "loss": 0.2483, "lr": 2.455451609310614e-05, "epoch": 0.9822920147009689, "percentage": 4.91, "elapsed_time": "0:53:27", "remaining_time": "17:14:57", "throughput": 3348.11, "total_tokens": 10738848} +{"current_steps": 8825, "total_steps": 179580, "loss": 0.0957, "lr": 2.456843746519657e-05, "epoch": 0.9828488695845863, "percentage": 4.91, "elapsed_time": "0:53:29", "remaining_time": "17:14:57", "throughput": 3348.12, "total_tokens": 10745216} +{"current_steps": 8830, "total_steps": 179580, "loss": 0.1159, "lr": 2.4582358837287002e-05, "epoch": 0.9834057244682036, "percentage": 4.92, "elapsed_time": "0:53:31", "remaining_time": "17:14:56", "throughput": 3348.13, "total_tokens": 10751552} +{"current_steps": 8835, "total_steps": 179580, "loss": 0.1194, "lr": 2.4596280209377436e-05, "epoch": 0.983962579351821, "percentage": 4.92, "elapsed_time": "0:53:33", "remaining_time": "17:14:55", "throughput": 3348.16, "total_tokens": 10757888} +{"current_steps": 8840, "total_steps": 179580, "loss": 0.1758, "lr": 2.461020158146787e-05, "epoch": 0.9845194342354382, "percentage": 4.92, "elapsed_time": "0:53:34", "remaining_time": "17:14:54", "throughput": 3348.18, "total_tokens": 10764128} +{"current_steps": 8845, "total_steps": 179580, "loss": 0.0636, "lr": 2.4624122953558305e-05, "epoch": 0.9850762891190555, "percentage": 4.93, "elapsed_time": "0:53:36", "remaining_time": "17:14:53", "throughput": 3348.17, "total_tokens": 10770336} +{"current_steps": 8850, "total_steps": 179580, "loss": 0.1447, "lr": 2.463804432564874e-05, "epoch": 0.9856331440026729, "percentage": 4.93, "elapsed_time": "0:53:38", "remaining_time": "17:14:50", "throughput": 3348.17, "total_tokens": 10776256} +{"current_steps": 8855, "total_steps": 179580, "loss": 0.2783, "lr": 2.465196569773917e-05, "epoch": 0.9861899988862902, "percentage": 4.93, "elapsed_time": "0:53:40", "remaining_time": "17:14:48", "throughput": 3348.19, "total_tokens": 10782272} +{"current_steps": 8860, "total_steps": 179580, "loss": 0.1361, "lr": 2.4665887069829604e-05, "epoch": 0.9867468537699076, "percentage": 4.93, "elapsed_time": "0:53:42", "remaining_time": "17:14:45", "throughput": 3348.18, "total_tokens": 10788256} +{"current_steps": 8865, "total_steps": 179580, "loss": 0.0791, "lr": 2.467980844192004e-05, "epoch": 0.9873037086535249, "percentage": 4.94, "elapsed_time": "0:53:43", "remaining_time": "17:14:44", "throughput": 3348.2, "total_tokens": 10794496} +{"current_steps": 8870, "total_steps": 179580, "loss": 0.21, "lr": 2.469372981401047e-05, "epoch": 0.9878605635371422, "percentage": 4.94, "elapsed_time": "0:53:45", "remaining_time": "17:14:42", "throughput": 3348.18, "total_tokens": 10800416} +{"current_steps": 8875, "total_steps": 179580, "loss": 0.1939, "lr": 2.4707651186100904e-05, "epoch": 0.9884174184207596, "percentage": 4.94, "elapsed_time": "0:53:47", "remaining_time": "17:14:40", "throughput": 3348.18, "total_tokens": 10806496} +{"current_steps": 8880, "total_steps": 179580, "loss": 0.2455, "lr": 2.4721572558191335e-05, "epoch": 0.9889742733043769, "percentage": 4.94, "elapsed_time": "0:53:49", "remaining_time": "17:14:38", "throughput": 3348.16, "total_tokens": 10812448} +{"current_steps": 8885, "total_steps": 179580, "loss": 0.1867, "lr": 2.473549393028177e-05, "epoch": 0.9895311281879942, "percentage": 4.95, "elapsed_time": "0:53:51", "remaining_time": "17:14:37", "throughput": 3348.17, "total_tokens": 10818752} +{"current_steps": 8890, "total_steps": 179580, "loss": 0.0892, "lr": 2.4749415302372204e-05, "epoch": 0.9900879830716115, "percentage": 4.95, "elapsed_time": "0:53:53", "remaining_time": "17:14:35", "throughput": 3348.16, "total_tokens": 10824896} +{"current_steps": 8895, "total_steps": 179580, "loss": 0.2366, "lr": 2.4763336674462638e-05, "epoch": 0.9906448379552288, "percentage": 4.95, "elapsed_time": "0:53:54", "remaining_time": "17:14:34", "throughput": 3348.15, "total_tokens": 10830976} +{"current_steps": 8900, "total_steps": 179580, "loss": 0.1083, "lr": 2.477725804655307e-05, "epoch": 0.9912016928388462, "percentage": 4.96, "elapsed_time": "0:53:56", "remaining_time": "17:14:34", "throughput": 3348.18, "total_tokens": 10837504} +{"current_steps": 8905, "total_steps": 179580, "loss": 0.1044, "lr": 2.4791179418643503e-05, "epoch": 0.9917585477224635, "percentage": 4.96, "elapsed_time": "0:53:58", "remaining_time": "17:14:32", "throughput": 3348.16, "total_tokens": 10843552} +{"current_steps": 8910, "total_steps": 179580, "loss": 0.0897, "lr": 2.4805100790733938e-05, "epoch": 0.9923154026060809, "percentage": 4.96, "elapsed_time": "0:54:00", "remaining_time": "17:14:28", "throughput": 3348.13, "total_tokens": 10849184} +{"current_steps": 8915, "total_steps": 179580, "loss": 0.1428, "lr": 2.481902216282437e-05, "epoch": 0.9928722574896982, "percentage": 4.96, "elapsed_time": "0:54:02", "remaining_time": "17:14:26", "throughput": 3348.13, "total_tokens": 10855200} +{"current_steps": 8920, "total_steps": 179580, "loss": 0.255, "lr": 2.4832943534914803e-05, "epoch": 0.9934291123733155, "percentage": 4.97, "elapsed_time": "0:54:03", "remaining_time": "17:14:25", "throughput": 3348.16, "total_tokens": 10861408} +{"current_steps": 8925, "total_steps": 179580, "loss": 0.2275, "lr": 2.4846864907005234e-05, "epoch": 0.9939859672569329, "percentage": 4.97, "elapsed_time": "0:54:05", "remaining_time": "17:14:22", "throughput": 3348.18, "total_tokens": 10867456} +{"current_steps": 8930, "total_steps": 179580, "loss": 0.1806, "lr": 2.4860786279095668e-05, "epoch": 0.9945428221405501, "percentage": 4.97, "elapsed_time": "0:54:07", "remaining_time": "17:14:21", "throughput": 3348.19, "total_tokens": 10873728} +{"current_steps": 8935, "total_steps": 179580, "loss": 0.1201, "lr": 2.4874707651186102e-05, "epoch": 0.9950996770241675, "percentage": 4.98, "elapsed_time": "0:54:09", "remaining_time": "17:14:21", "throughput": 3348.22, "total_tokens": 10880224} +{"current_steps": 8940, "total_steps": 179580, "loss": 0.2718, "lr": 2.4888629023276537e-05, "epoch": 0.9956565319077848, "percentage": 4.98, "elapsed_time": "0:54:11", "remaining_time": "17:14:19", "throughput": 3348.21, "total_tokens": 10886240} +{"current_steps": 8945, "total_steps": 179580, "loss": 0.12, "lr": 2.4902550395366968e-05, "epoch": 0.9962133867914021, "percentage": 4.98, "elapsed_time": "0:54:13", "remaining_time": "17:14:18", "throughput": 3348.2, "total_tokens": 10892352} +{"current_steps": 8950, "total_steps": 179580, "loss": 0.1014, "lr": 2.4916471767457402e-05, "epoch": 0.9967702416750195, "percentage": 4.98, "elapsed_time": "0:54:15", "remaining_time": "17:14:16", "throughput": 3348.23, "total_tokens": 10898592} +{"current_steps": 8955, "total_steps": 179580, "loss": 0.1661, "lr": 2.4930393139547836e-05, "epoch": 0.9973270965586368, "percentage": 4.99, "elapsed_time": "0:54:16", "remaining_time": "17:14:13", "throughput": 3348.23, "total_tokens": 10904384} +{"current_steps": 8960, "total_steps": 179580, "loss": 0.0867, "lr": 2.4944314511638267e-05, "epoch": 0.9978839514422542, "percentage": 4.99, "elapsed_time": "0:54:18", "remaining_time": "17:14:11", "throughput": 3348.22, "total_tokens": 10910496} +{"current_steps": 8965, "total_steps": 179580, "loss": 0.2204, "lr": 2.49582358837287e-05, "epoch": 0.9984408063258715, "percentage": 4.99, "elapsed_time": "0:54:20", "remaining_time": "17:14:09", "throughput": 3348.22, "total_tokens": 10916608} +{"current_steps": 8970, "total_steps": 179580, "loss": 0.153, "lr": 2.4972157255819133e-05, "epoch": 0.9989976612094889, "percentage": 4.99, "elapsed_time": "0:54:22", "remaining_time": "17:14:07", "throughput": 3348.21, "total_tokens": 10922624} +{"current_steps": 8975, "total_steps": 179580, "loss": 0.1942, "lr": 2.4986078627909567e-05, "epoch": 0.9995545160931061, "percentage": 5.0, "elapsed_time": "0:54:24", "remaining_time": "17:14:06", "throughput": 3348.18, "total_tokens": 10928640} +{"current_steps": 8979, "total_steps": 179580, "eval_loss": 0.1737435758113861, "epoch": 1.0, "percentage": 5.0, "elapsed_time": "0:56:17", "remaining_time": "17:49:36", "throughput": 3236.8, "total_tokens": 10932896} +{"current_steps": 8980, "total_steps": 179580, "loss": 0.1613, "lr": 2.5e-05, "epoch": 1.0001113709767235, "percentage": 5.0, "elapsed_time": "0:56:19", "remaining_time": "17:49:54", "throughput": 3235.85, "total_tokens": 10934144} +{"current_steps": 8985, "total_steps": 179580, "loss": 0.2357, "lr": 2.5013921372090432e-05, "epoch": 1.0006682258603408, "percentage": 5.0, "elapsed_time": "0:56:20", "remaining_time": "17:49:51", "throughput": 3235.92, "total_tokens": 10940256} +{"current_steps": 8990, "total_steps": 179580, "loss": 0.0445, "lr": 2.502784274418087e-05, "epoch": 1.0012250807439582, "percentage": 5.01, "elapsed_time": "0:56:22", "remaining_time": "17:49:49", "throughput": 3235.98, "total_tokens": 10946528} +{"current_steps": 8995, "total_steps": 179580, "loss": 0.2129, "lr": 2.5041764116271297e-05, "epoch": 1.0017819356275754, "percentage": 5.01, "elapsed_time": "0:56:24", "remaining_time": "17:49:46", "throughput": 3236.03, "total_tokens": 10952544}