| {"current_steps": 5, "total_steps": 3099, "loss": 15.8295, "lr": 6.451612903225807e-07, "epoch": 0.0048408568316592035, "percentage": 0.16, "elapsed_time": "0:16:05", "remaining_time": "6 days, 21:55:30", "throughput": 2042.78, "total_tokens": 1971904} | |
| {"current_steps": 10, "total_steps": 3099, "loss": 15.3582, "lr": 1.4516129032258066e-06, "epoch": 0.009681713663318407, "percentage": 0.32, "elapsed_time": "0:32:36", "remaining_time": "6 days, 23:53:42", "throughput": 2063.98, "total_tokens": 4038576} | |
| {"current_steps": 15, "total_steps": 3099, "loss": 12.8373, "lr": 2.2580645161290324e-06, "epoch": 0.014522570494977611, "percentage": 0.48, "elapsed_time": "0:46:06", "remaining_time": "6 days, 14:00:26", "throughput": 2129.5, "total_tokens": 5891616} | |
| {"current_steps": 20, "total_steps": 3099, "loss": 9.4205, "lr": 3.064516129032258e-06, "epoch": 0.019363427326636814, "percentage": 0.65, "elapsed_time": "0:58:42", "remaining_time": "6 days, 6:37:04", "throughput": 2228.65, "total_tokens": 7849472} | |
| {"current_steps": 25, "total_steps": 3099, "loss": 7.6571, "lr": 3.870967741935484e-06, "epoch": 0.024204284158296018, "percentage": 0.81, "elapsed_time": "1:03:40", "remaining_time": "5 days, 10:29:06", "throughput": 2536.34, "total_tokens": 9689648} | |
| {"current_steps": 30, "total_steps": 3099, "loss": 6.7016, "lr": 4.67741935483871e-06, "epoch": 0.029045140989955223, "percentage": 0.97, "elapsed_time": "1:09:55", "remaining_time": "4 days, 23:13:55", "throughput": 2777.06, "total_tokens": 11652144} | |
| {"current_steps": 35, "total_steps": 3099, "loss": 5.8834, "lr": 5.483870967741936e-06, "epoch": 0.03388599782161442, "percentage": 1.13, "elapsed_time": "1:14:43", "remaining_time": "4 days, 13:01:10", "throughput": 3021.11, "total_tokens": 13544176} | |
| {"current_steps": 40, "total_steps": 3099, "loss": 5.0909, "lr": 6.290322580645161e-06, "epoch": 0.03872685465327363, "percentage": 1.29, "elapsed_time": "1:18:58", "remaining_time": "4 days, 4:39:43", "throughput": 3232.05, "total_tokens": 15315344} | |
| {"current_steps": 45, "total_steps": 3099, "loss": 4.3397, "lr": 7.096774193548387e-06, "epoch": 0.04356771148493283, "percentage": 1.45, "elapsed_time": "1:23:11", "remaining_time": "3 days, 22:06:12", "throughput": 3424.59, "total_tokens": 17094640} | |
| {"current_steps": 50, "total_steps": 3099, "loss": 3.5344, "lr": 7.903225806451613e-06, "epoch": 0.048408568316592036, "percentage": 1.61, "elapsed_time": "1:28:40", "remaining_time": "3 days, 18:07:47", "throughput": 3568.95, "total_tokens": 18990000} | |
| {"current_steps": 55, "total_steps": 3099, "loss": 2.5445, "lr": 8.70967741935484e-06, "epoch": 0.05324942514825124, "percentage": 1.77, "elapsed_time": "1:37:40", "remaining_time": "3 days, 18:05:27", "throughput": 3558.82, "total_tokens": 20854912} | |
| {"current_steps": 60, "total_steps": 3099, "loss": 1.5114, "lr": 9.516129032258064e-06, "epoch": 0.058090281979910445, "percentage": 1.94, "elapsed_time": "1:51:29", "remaining_time": "3 days, 22:06:50", "throughput": 3398.66, "total_tokens": 22734480} | |
| {"current_steps": 65, "total_steps": 3099, "loss": 0.681, "lr": 1.0322580645161291e-05, "epoch": 0.06293113881156964, "percentage": 2.1, "elapsed_time": "2:08:14", "remaining_time": "4 days, 3:46:14", "throughput": 3210.69, "total_tokens": 24705984} | |
| {"current_steps": 70, "total_steps": 3099, "loss": 0.3083, "lr": 1.1129032258064517e-05, "epoch": 0.06777199564322885, "percentage": 2.26, "elapsed_time": "2:22:02", "remaining_time": "4 days, 6:26:38", "throughput": 3123.74, "total_tokens": 26623312} | |
| {"current_steps": 75, "total_steps": 3099, "loss": 0.2031, "lr": 1.1935483870967743e-05, "epoch": 0.07261285247488805, "percentage": 2.42, "elapsed_time": "2:37:28", "remaining_time": "4 days, 9:49:26", "throughput": 3022.73, "total_tokens": 28560464} | |
| {"current_steps": 80, "total_steps": 3099, "loss": 0.1776, "lr": 1.2741935483870968e-05, "epoch": 0.07745370930654726, "percentage": 2.58, "elapsed_time": "2:50:41", "remaining_time": "4 days, 11:21:31", "throughput": 2963.77, "total_tokens": 30353664} | |
| {"current_steps": 85, "total_steps": 3099, "loss": 0.1556, "lr": 1.3548387096774195e-05, "epoch": 0.08229456613820646, "percentage": 2.74, "elapsed_time": "3:05:26", "remaining_time": "4 days, 13:35:50", "throughput": 2900.74, "total_tokens": 32276544} | |
| {"current_steps": 90, "total_steps": 3099, "loss": 0.1393, "lr": 1.4354838709677421e-05, "epoch": 0.08713542296986566, "percentage": 2.9, "elapsed_time": "3:16:49", "remaining_time": "4 days, 13:40:46", "throughput": 2890.58, "total_tokens": 34137648} | |
| {"current_steps": 95, "total_steps": 3099, "loss": 0.1302, "lr": 1.5161290322580646e-05, "epoch": 0.09197627980152487, "percentage": 3.07, "elapsed_time": "3:21:34", "remaining_time": "4 days, 10:13:46", "throughput": 2976.53, "total_tokens": 35998352} | |
| {"current_steps": 100, "total_steps": 3099, "loss": 0.1201, "lr": 1.596774193548387e-05, "epoch": 0.09681713663318407, "percentage": 3.23, "elapsed_time": "3:26:34", "remaining_time": "4 days, 7:15:03", "throughput": 3055.39, "total_tokens": 37869184} | |
| {"current_steps": 105, "total_steps": 3099, "loss": 0.1209, "lr": 1.6774193548387098e-05, "epoch": 0.10165799346484328, "percentage": 3.39, "elapsed_time": "3:31:42", "remaining_time": "4 days, 4:36:45", "throughput": 3124.89, "total_tokens": 39694272} | |
| {"current_steps": 110, "total_steps": 3099, "loss": 0.1209, "lr": 1.7580645161290325e-05, "epoch": 0.10649885029650248, "percentage": 3.55, "elapsed_time": "3:36:29", "remaining_time": "4 days, 2:02:30", "throughput": 3197.28, "total_tokens": 41530000} | |
| {"current_steps": 115, "total_steps": 3099, "loss": 0.1105, "lr": 1.838709677419355e-05, "epoch": 0.11133970712816169, "percentage": 3.71, "elapsed_time": "3:41:46", "remaining_time": "3 days, 23:54:26", "throughput": 3261.35, "total_tokens": 43396048} | |
| {"current_steps": 120, "total_steps": 3099, "loss": 0.1074, "lr": 1.9193548387096774e-05, "epoch": 0.11618056395982089, "percentage": 3.87, "elapsed_time": "3:55:10", "remaining_time": "4 days, 1:18:07", "throughput": 3213.54, "total_tokens": 45343968} | |
| {"current_steps": 125, "total_steps": 3099, "loss": 0.1037, "lr": 2e-05, "epoch": 0.1210214207914801, "percentage": 4.03, "elapsed_time": "4:10:40", "remaining_time": "4 days, 3:24:03", "throughput": 3146.31, "total_tokens": 47322080} | |
| {"current_steps": 130, "total_steps": 3099, "loss": 0.1062, "lr": 2.0806451612903226e-05, "epoch": 0.12586227762313928, "percentage": 4.19, "elapsed_time": "4:27:19", "remaining_time": "4 days, 5:45:10", "throughput": 3071.01, "total_tokens": 49256592} | |
| {"current_steps": 135, "total_steps": 3099, "loss": 0.1022, "lr": 2.1612903225806454e-05, "epoch": 0.1307031344547985, "percentage": 4.36, "elapsed_time": "4:41:21", "remaining_time": "4 days, 6:57:27", "throughput": 3030.19, "total_tokens": 51154720} | |
| {"current_steps": 140, "total_steps": 3099, "loss": 0.0953, "lr": 2.2419354838709678e-05, "epoch": 0.1355439912864577, "percentage": 4.52, "elapsed_time": "5:00:21", "remaining_time": "4 days, 9:48:20", "throughput": 2955.59, "total_tokens": 53264704} | |
| {"current_steps": 145, "total_steps": 3099, "loss": 0.1071, "lr": 2.3225806451612906e-05, "epoch": 0.1403848481181169, "percentage": 4.68, "elapsed_time": "5:13:21", "remaining_time": "4 days, 10:23:52", "throughput": 2930.58, "total_tokens": 55099456} | |
| {"current_steps": 150, "total_steps": 3099, "loss": 0.1, "lr": 2.403225806451613e-05, "epoch": 0.1452257049497761, "percentage": 4.84, "elapsed_time": "5:28:25", "remaining_time": "4 days, 11:36:47", "throughput": 2894.33, "total_tokens": 57033824} | |
| {"current_steps": 155, "total_steps": 3099, "loss": 0.1024, "lr": 2.4838709677419354e-05, "epoch": 0.15006656178143532, "percentage": 5.0, "elapsed_time": "5:41:50", "remaining_time": "4 days, 12:12:51", "throughput": 2870.53, "total_tokens": 58876656} | |
| {"current_steps": 160, "total_steps": 3099, "loss": 0.0978, "lr": 2.5645161290322582e-05, "epoch": 0.1549074186130945, "percentage": 5.16, "elapsed_time": "5:57:54", "remaining_time": "4 days, 13:34:27", "throughput": 2834.82, "total_tokens": 60877568} | |
| {"current_steps": 165, "total_steps": 3099, "loss": 0.1081, "lr": 2.645161290322581e-05, "epoch": 0.15974827544475373, "percentage": 5.32, "elapsed_time": "6:11:59", "remaining_time": "4 days, 14:14:37", "throughput": 2811.77, "total_tokens": 62756608} | |
| {"current_steps": 170, "total_steps": 3099, "loss": 0.0934, "lr": 2.7258064516129034e-05, "epoch": 0.16458913227641292, "percentage": 5.49, "elapsed_time": "6:27:02", "remaining_time": "4 days, 15:08:38", "throughput": 2785.54, "total_tokens": 64688544} | |
| {"current_steps": 175, "total_steps": 3099, "loss": 0.0956, "lr": 2.806451612903226e-05, "epoch": 0.16942998910807214, "percentage": 5.65, "elapsed_time": "6:38:59", "remaining_time": "4 days, 15:06:37", "throughput": 2777.96, "total_tokens": 66503488} | |
| {"current_steps": 180, "total_steps": 3099, "loss": 0.0945, "lr": 2.8870967741935483e-05, "epoch": 0.17427084593973133, "percentage": 5.81, "elapsed_time": "6:53:45", "remaining_time": "4 days, 15:49:42", "throughput": 2756.31, "total_tokens": 68426064} | |
| {"current_steps": 185, "total_steps": 3099, "loss": 0.0957, "lr": 2.967741935483871e-05, "epoch": 0.17911170277139055, "percentage": 5.97, "elapsed_time": "7:07:32", "remaining_time": "4 days, 16:14:15", "throughput": 2740.53, "total_tokens": 70300224} | |
| {"current_steps": 190, "total_steps": 3099, "loss": 0.1048, "lr": 3.0483870967741935e-05, "epoch": 0.18395255960304974, "percentage": 6.13, "elapsed_time": "7:22:12", "remaining_time": "4 days, 16:50:23", "throughput": 2719.46, "total_tokens": 72153584} | |
| {"current_steps": 195, "total_steps": 3099, "loss": 0.1038, "lr": 3.1290322580645166e-05, "epoch": 0.18879341643470895, "percentage": 6.29, "elapsed_time": "7:35:53", "remaining_time": "4 days, 17:09:19", "throughput": 2704.9, "total_tokens": 73989040} | |
| {"current_steps": 200, "total_steps": 3099, "loss": 0.106, "lr": 3.2096774193548393e-05, "epoch": 0.19363427326636815, "percentage": 6.45, "elapsed_time": "7:49:40", "remaining_time": "4 days, 17:27:52", "throughput": 2691.41, "total_tokens": 75844448} | |
| {"current_steps": 205, "total_steps": 3099, "loss": 0.0979, "lr": 3.2903225806451614e-05, "epoch": 0.19847513009802736, "percentage": 6.62, "elapsed_time": "8:02:34", "remaining_time": "4 days, 17:32:35", "throughput": 2681.0, "total_tokens": 77627520} | |
| {"current_steps": 210, "total_steps": 3099, "loss": 0.0953, "lr": 3.370967741935484e-05, "epoch": 0.20331598692968655, "percentage": 6.78, "elapsed_time": "8:15:08", "remaining_time": "4 days, 17:31:47", "throughput": 2673.18, "total_tokens": 79416736} | |
| {"current_steps": 215, "total_steps": 3099, "loss": 0.0936, "lr": 3.451612903225806e-05, "epoch": 0.20815684376134574, "percentage": 6.94, "elapsed_time": "8:29:36", "remaining_time": "4 days, 17:55:45", "throughput": 2661.43, "total_tokens": 81375920} | |
| {"current_steps": 220, "total_steps": 3099, "loss": 0.0954, "lr": 3.532258064516129e-05, "epoch": 0.21299770059300496, "percentage": 7.1, "elapsed_time": "8:42:28", "remaining_time": "4 days, 17:57:20", "throughput": 2654.99, "total_tokens": 83230304} | |
| {"current_steps": 225, "total_steps": 3099, "loss": 0.095, "lr": 3.612903225806452e-05, "epoch": 0.21783855742466415, "percentage": 7.26, "elapsed_time": "8:57:41", "remaining_time": "4 days, 18:28:04", "throughput": 2643.17, "total_tokens": 85271952} | |
| {"current_steps": 230, "total_steps": 3099, "loss": 0.0898, "lr": 3.6935483870967746e-05, "epoch": 0.22267941425632337, "percentage": 7.42, "elapsed_time": "9:10:22", "remaining_time": "4 days, 18:25:21", "throughput": 2637.23, "total_tokens": 87088336} | |
| {"current_steps": 235, "total_steps": 3099, "loss": 0.1018, "lr": 3.7741935483870974e-05, "epoch": 0.22752027108798256, "percentage": 7.58, "elapsed_time": "9:21:55", "remaining_time": "4 days, 18:08:13", "throughput": 2633.98, "total_tokens": 88804864} | |
| {"current_steps": 240, "total_steps": 3099, "loss": 0.1003, "lr": 3.8548387096774195e-05, "epoch": 0.23236112791964178, "percentage": 7.74, "elapsed_time": "9:34:20", "remaining_time": "4 days, 18:01:53", "throughput": 2631.36, "total_tokens": 90678512} | |
| {"current_steps": 245, "total_steps": 3099, "loss": 0.1012, "lr": 3.935483870967742e-05, "epoch": 0.23720198475130097, "percentage": 7.91, "elapsed_time": "9:47:39", "remaining_time": "4 days, 18:05:41", "throughput": 2623.85, "total_tokens": 92516880} | |
| {"current_steps": 250, "total_steps": 3099, "loss": 0.0944, "lr": 4.016129032258065e-05, "epoch": 0.2420428415829602, "percentage": 8.07, "elapsed_time": "10:01:20", "remaining_time": "4 days, 18:12:48", "throughput": 2616.04, "total_tokens": 94387008} | |
| {"current_steps": 255, "total_steps": 3099, "loss": 0.0952, "lr": 4.096774193548387e-05, "epoch": 0.24688369841461938, "percentage": 8.23, "elapsed_time": "10:15:29", "remaining_time": "4 days, 18:24:29", "throughput": 2607.45, "total_tokens": 96291040} | |
| {"current_steps": 260, "total_steps": 3099, "loss": 0.1029, "lr": 4.17741935483871e-05, "epoch": 0.25172455524627857, "percentage": 8.39, "elapsed_time": "10:28:34", "remaining_time": "4 days, 18:23:33", "throughput": 2601.72, "total_tokens": 98122448} | |
| {"current_steps": 265, "total_steps": 3099, "loss": 0.0955, "lr": 4.258064516129032e-05, "epoch": 0.2565654120779378, "percentage": 8.55, "elapsed_time": "10:41:26", "remaining_time": "4 days, 18:19:51", "throughput": 2598.82, "total_tokens": 100020384} | |
| {"current_steps": 270, "total_steps": 3099, "loss": 0.0966, "lr": 4.3387096774193554e-05, "epoch": 0.261406268909597, "percentage": 8.71, "elapsed_time": "10:53:20", "remaining_time": "4 days, 18:05:37", "throughput": 2597.17, "total_tokens": 101811184} | |
| {"current_steps": 275, "total_steps": 3099, "loss": 0.0977, "lr": 4.4193548387096775e-05, "epoch": 0.2662471257412562, "percentage": 8.87, "elapsed_time": "11:03:58", "remaining_time": "4 days, 17:38:27", "throughput": 2599.1, "total_tokens": 103544960} | |
| {"current_steps": 280, "total_steps": 3099, "loss": 0.0941, "lr": 4.5e-05, "epoch": 0.2710879825729154, "percentage": 9.04, "elapsed_time": "11:15:01", "remaining_time": "4 days, 17:16:05", "throughput": 2603.13, "total_tokens": 105431200} | |
| {"current_steps": 285, "total_steps": 3099, "loss": 0.0973, "lr": 4.580645161290323e-05, "epoch": 0.27592883940457463, "percentage": 9.2, "elapsed_time": "11:21:03", "remaining_time": "4 days, 16:04:34", "throughput": 2627.49, "total_tokens": 107368704} | |
| {"current_steps": 290, "total_steps": 3099, "loss": 0.0949, "lr": 4.661290322580645e-05, "epoch": 0.2807696962362338, "percentage": 9.36, "elapsed_time": "11:26:30", "remaining_time": "4 days, 14:49:41", "throughput": 2652.47, "total_tokens": 109257200} | |
| {"current_steps": 295, "total_steps": 3099, "loss": 0.0953, "lr": 4.741935483870968e-05, "epoch": 0.285610553067893, "percentage": 9.52, "elapsed_time": "11:31:35", "remaining_time": "4 days, 13:33:41", "throughput": 2678.6, "total_tokens": 111150704} | |
| {"current_steps": 300, "total_steps": 3099, "loss": 0.097, "lr": 4.822580645161291e-05, "epoch": 0.2904514098995522, "percentage": 9.68, "elapsed_time": "11:37:05", "remaining_time": "4 days, 12:23:47", "throughput": 2702.56, "total_tokens": 113034512} | |
| {"current_steps": 305, "total_steps": 3099, "loss": 0.0897, "lr": 4.903225806451613e-05, "epoch": 0.29529226673121145, "percentage": 9.84, "elapsed_time": "11:42:41", "remaining_time": "4 days, 11:17:05", "throughput": 2726.12, "total_tokens": 114937056} | |
| {"current_steps": 310, "total_steps": 3099, "loss": 0.0887, "lr": 4.983870967741936e-05, "epoch": 0.30013312356287064, "percentage": 10.0, "elapsed_time": "11:48:59", "remaining_time": "4 days, 10:18:35", "throughput": 2749.36, "total_tokens": 116955552} | |
| {"current_steps": 315, "total_steps": 3099, "loss": 0.0981, "lr": 4.999974623485097e-05, "epoch": 0.30497398039452983, "percentage": 10.16, "elapsed_time": "11:54:30", "remaining_time": "4 days, 9:14:54", "throughput": 2771.84, "total_tokens": 118830688} | |
| {"current_steps": 320, "total_steps": 3099, "loss": 0.0974, "lr": 4.999871532276243e-05, "epoch": 0.309814837226189, "percentage": 10.33, "elapsed_time": "11:59:24", "remaining_time": "4 days, 8:07:38", "throughput": 2796.07, "total_tokens": 120691504} | |
| {"current_steps": 325, "total_steps": 3099, "loss": 0.0948, "lr": 4.999689143608857e-05, "epoch": 0.3146556940578482, "percentage": 10.49, "elapsed_time": "12:04:17", "remaining_time": "4 days, 7:02:06", "throughput": 2820.24, "total_tokens": 122560384} | |
| {"current_steps": 330, "total_steps": 3099, "loss": 0.0901, "lr": 4.999427463268419e-05, "epoch": 0.31949655088950746, "percentage": 10.65, "elapsed_time": "12:09:56", "remaining_time": "4 days, 6:04:52", "throughput": 2842.54, "total_tokens": 124493200} | |
| {"current_steps": 335, "total_steps": 3099, "loss": 0.09, "lr": 4.999086499555591e-05, "epoch": 0.32433740772116665, "percentage": 10.81, "elapsed_time": "12:15:04", "remaining_time": "4 days, 5:04:55", "throughput": 2864.86, "total_tokens": 126353344} | |
| {"current_steps": 340, "total_steps": 3099, "loss": 0.0943, "lr": 4.9986662632859504e-05, "epoch": 0.32917826455282584, "percentage": 10.97, "elapsed_time": "12:20:10", "remaining_time": "4 days, 4:06:20", "throughput": 2886.17, "total_tokens": 128177040} | |
| {"current_steps": 345, "total_steps": 3099, "loss": 0.0921, "lr": 4.9981667677896506e-05, "epoch": 0.33401912138448503, "percentage": 11.13, "elapsed_time": "12:24:30", "remaining_time": "4 days, 3:03:05", "throughput": 2909.56, "total_tokens": 129970848} | |
| {"current_steps": 350, "total_steps": 3099, "loss": 0.0933, "lr": 4.997588028910993e-05, "epoch": 0.3388599782161443, "percentage": 11.29, "elapsed_time": "12:30:22", "remaining_time": "4 days, 2:13:41", "throughput": 2930.39, "total_tokens": 131934512} | |
| {"current_steps": 355, "total_steps": 3099, "loss": 0.0919, "lr": 4.996930065007932e-05, "epoch": 0.34370083504780347, "percentage": 11.46, "elapsed_time": "12:35:35", "remaining_time": "4 days, 1:20:25", "throughput": 2951.94, "total_tokens": 133828000} | |
| {"current_steps": 360, "total_steps": 3099, "loss": 0.0894, "lr": 4.996192896951485e-05, "epoch": 0.34854169187946266, "percentage": 11.62, "elapsed_time": "12:40:01", "remaining_time": "4 days, 0:22:33", "throughput": 2974.79, "total_tokens": 135655808} | |
| {"current_steps": 365, "total_steps": 3099, "loss": 0.089, "lr": 4.995376548125075e-05, "epoch": 0.35338254871112185, "percentage": 11.78, "elapsed_time": "12:45:22", "remaining_time": "3 days, 23:32:55", "throughput": 2995.25, "total_tokens": 137547952} | |
| {"current_steps": 370, "total_steps": 3099, "loss": 0.0963, "lr": 4.994481044423788e-05, "epoch": 0.3582234055427811, "percentage": 11.94, "elapsed_time": "12:50:31", "remaining_time": "3 days, 22:43:08", "throughput": 3015.45, "total_tokens": 139408624} | |
| {"current_steps": 375, "total_steps": 3099, "loss": 0.098, "lr": 4.99350641425355e-05, "epoch": 0.3630642623744403, "percentage": 12.1, "elapsed_time": "12:54:54", "remaining_time": "3 days, 21:48:56", "throughput": 3035.77, "total_tokens": 141146720} | |
| {"current_steps": 380, "total_steps": 3099, "loss": 0.0927, "lr": 4.99245268853023e-05, "epoch": 0.3679051192060995, "percentage": 12.26, "elapsed_time": "12:58:44", "remaining_time": "3 days, 20:52:05", "throughput": 3057.84, "total_tokens": 142875840} | |
| {"current_steps": 385, "total_steps": 3099, "loss": 0.0881, "lr": 4.9913199006786515e-05, "epoch": 0.37274597603775866, "percentage": 12.42, "elapsed_time": "13:04:41", "remaining_time": "3 days, 20:11:37", "throughput": 3077.16, "total_tokens": 144878720} | |
| {"current_steps": 390, "total_steps": 3099, "loss": 0.1036, "lr": 4.9901080866315416e-05, "epoch": 0.3775868328694179, "percentage": 12.58, "elapsed_time": "13:08:41", "remaining_time": "3 days, 19:18:20", "throughput": 3098.06, "total_tokens": 146604080} | |
| {"current_steps": 395, "total_steps": 3099, "loss": 0.0879, "lr": 4.988817284828386e-05, "epoch": 0.3824276897010771, "percentage": 12.75, "elapsed_time": "13:13:45", "remaining_time": "3 days, 18:33:42", "throughput": 3118.21, "total_tokens": 148505760} | |
| {"current_steps": 400, "total_steps": 3099, "loss": 0.0893, "lr": 4.9874475362142076e-05, "epoch": 0.3872685465327363, "percentage": 12.91, "elapsed_time": "13:19:15", "remaining_time": "3 days, 17:53:00", "throughput": 3136.78, "total_tokens": 150426000} | |
| {"current_steps": 405, "total_steps": 3099, "loss": 0.0909, "lr": 4.9859988842382744e-05, "epoch": 0.3921094033643955, "percentage": 13.07, "elapsed_time": "13:24:01", "remaining_time": "3 days, 17:08:18", "throughput": 3155.84, "total_tokens": 152243872} | |
| {"current_steps": 410, "total_steps": 3099, "loss": 0.0947, "lr": 4.984471374852715e-05, "epoch": 0.3969502601960547, "percentage": 13.23, "elapsed_time": "13:28:46", "remaining_time": "3 days, 16:24:26", "throughput": 3174.57, "total_tokens": 154052240} | |
| {"current_steps": 415, "total_steps": 3099, "loss": 0.0907, "lr": 4.9828650565110644e-05, "epoch": 0.4017911170277139, "percentage": 13.39, "elapsed_time": "13:34:48", "remaining_time": "3 days, 15:49:41", "throughput": 3191.4, "total_tokens": 156020992} | |
| {"current_steps": 420, "total_steps": 3099, "loss": 0.09, "lr": 4.981179980166726e-05, "epoch": 0.4066319738593731, "percentage": 13.55, "elapsed_time": "13:40:30", "remaining_time": "3 days, 15:13:38", "throughput": 3208.12, "total_tokens": 157936240} | |
| {"current_steps": 425, "total_steps": 3099, "loss": 0.0903, "lr": 4.979416199271354e-05, "epoch": 0.4114728306910323, "percentage": 13.71, "elapsed_time": "13:44:50", "remaining_time": "3 days, 14:29:45", "throughput": 3227.52, "total_tokens": 159733040} | |
| {"current_steps": 430, "total_steps": 3099, "loss": 0.093, "lr": 4.977573769773162e-05, "epoch": 0.4163136875226915, "percentage": 13.88, "elapsed_time": "13:50:46", "remaining_time": "3 days, 13:56:38", "throughput": 3243.19, "total_tokens": 161662848} | |
| {"current_steps": 435, "total_steps": 3099, "loss": 0.0953, "lr": 4.975652750115143e-05, "epoch": 0.42115454435435073, "percentage": 14.04, "elapsed_time": "13:55:44", "remaining_time": "3 days, 13:18:10", "throughput": 3260.8, "total_tokens": 163510512} | |
| {"current_steps": 440, "total_steps": 3099, "loss": 0.0925, "lr": 4.973653201233219e-05, "epoch": 0.4259954011860099, "percentage": 14.2, "elapsed_time": "14:02:25", "remaining_time": "3 days, 12:50:58", "throughput": 3273.91, "total_tokens": 165482800} | |
| {"current_steps": 445, "total_steps": 3099, "loss": 0.0893, "lr": 4.971575186554307e-05, "epoch": 0.4308362580176691, "percentage": 14.36, "elapsed_time": "14:08:34", "remaining_time": "3 days, 12:20:57", "throughput": 3288.39, "total_tokens": 167426896} | |
| {"current_steps": 450, "total_steps": 3099, "loss": 0.0943, "lr": 4.969418771994309e-05, "epoch": 0.4356771148493283, "percentage": 14.52, "elapsed_time": "14:13:04", "remaining_time": "3 days, 11:41:45", "throughput": 3306.35, "total_tokens": 169233824} | |
| {"current_steps": 455, "total_steps": 3099, "loss": 0.0938, "lr": 4.967184025956015e-05, "epoch": 0.44051797168098755, "percentage": 14.68, "elapsed_time": "14:17:37", "remaining_time": "3 days, 11:03:38", "throughput": 3324.2, "total_tokens": 171055232} | |
| {"current_steps": 460, "total_steps": 3099, "loss": 0.0915, "lr": 4.9648710193269424e-05, "epoch": 0.44535882851264674, "percentage": 14.84, "elapsed_time": "14:22:23", "remaining_time": "3 days, 10:27:31", "throughput": 3341.35, "total_tokens": 172893920} | |
| {"current_steps": 465, "total_steps": 3099, "loss": 0.0849, "lr": 4.962479825477079e-05, "epoch": 0.45019968534430593, "percentage": 15.0, "elapsed_time": "14:27:40", "remaining_time": "3 days, 9:54:56", "throughput": 3357.3, "total_tokens": 174782016} | |
| {"current_steps": 470, "total_steps": 3099, "loss": 0.0886, "lr": 4.9600105202565605e-05, "epoch": 0.4550405421759651, "percentage": 15.17, "elapsed_time": "14:33:01", "remaining_time": "3 days, 9:23:20", "throughput": 3372.79, "total_tokens": 176671136} | |
| {"current_steps": 475, "total_steps": 3099, "loss": 0.0924, "lr": 4.9574631819932646e-05, "epoch": 0.45988139900762437, "percentage": 15.33, "elapsed_time": "14:38:16", "remaining_time": "3 days, 8:51:49", "throughput": 3387.76, "total_tokens": 178524848} | |
| {"current_steps": 480, "total_steps": 3099, "loss": 0.0872, "lr": 4.9548378914903225e-05, "epoch": 0.46472225583928356, "percentage": 15.49, "elapsed_time": "14:43:33", "remaining_time": "3 days, 8:20:56", "throughput": 3402.92, "total_tokens": 180401664} | |
| {"current_steps": 485, "total_steps": 3099, "loss": 0.0948, "lr": 4.95213473202356e-05, "epoch": 0.46956311267094275, "percentage": 15.65, "elapsed_time": "14:48:13", "remaining_time": "3 days, 7:47:15", "throughput": 3419.45, "total_tokens": 182234608} | |
| {"current_steps": 490, "total_steps": 3099, "loss": 0.0884, "lr": 4.9493537893388544e-05, "epoch": 0.47440396950260194, "percentage": 15.81, "elapsed_time": "14:54:05", "remaining_time": "3 days, 7:20:32", "throughput": 3432.88, "total_tokens": 184157296} | |
| {"current_steps": 495, "total_steps": 3099, "loss": 0.0916, "lr": 4.9464951516494116e-05, "epoch": 0.4792448263342612, "percentage": 15.97, "elapsed_time": "14:58:44", "remaining_time": "3 days, 6:47:53", "throughput": 3448.89, "total_tokens": 185978048} | |
| {"current_steps": 500, "total_steps": 3099, "loss": 0.0877, "lr": 4.943558909632975e-05, "epoch": 0.4840856831659204, "percentage": 16.13, "elapsed_time": "15:03:51", "remaining_time": "3 days, 6:18:14", "throughput": 3464.18, "total_tokens": 187867312} | |
| {"current_steps": 505, "total_steps": 3099, "loss": 0.0962, "lr": 4.94054515642894e-05, "epoch": 0.48892653999757957, "percentage": 16.3, "elapsed_time": "15:09:27", "remaining_time": "3 days, 5:51:31", "throughput": 3477.56, "total_tokens": 189760400} | |
| {"current_steps": 510, "total_steps": 3099, "loss": 0.084, "lr": 4.937453987635408e-05, "epoch": 0.49376739682923876, "percentage": 16.46, "elapsed_time": "15:16:27", "remaining_time": "3 days, 5:32:22", "throughput": 3487.58, "total_tokens": 191773264} | |
| {"current_steps": 515, "total_steps": 3099, "loss": 0.0868, "lr": 4.934285501306152e-05, "epoch": 0.498608253660898, "percentage": 16.62, "elapsed_time": "15:23:04", "remaining_time": "3 days, 5:11:31", "throughput": 3498.26, "total_tokens": 193750176} | |
| {"current_steps": 520, "total_steps": 3099, "loss": 0.0895, "lr": 4.931039797947498e-05, "epoch": 0.5034491104925571, "percentage": 16.78, "elapsed_time": "15:28:06", "remaining_time": "3 days, 4:43:04", "throughput": 3513.66, "total_tokens": 195664256} | |
| {"current_steps": 525, "total_steps": 3099, "loss": 0.0875, "lr": 4.9277169805151496e-05, "epoch": 0.5082899673242164, "percentage": 16.94, "elapsed_time": "15:33:56", "remaining_time": "3 days, 4:18:58", "throughput": 3525.87, "total_tokens": 197577536} | |
| {"current_steps": 530, "total_steps": 3099, "loss": 0.0907, "lr": 4.924317154410915e-05, "epoch": 0.5131308241558756, "percentage": 17.1, "elapsed_time": "15:39:45", "remaining_time": "3 days, 3:55:09", "throughput": 3537.11, "total_tokens": 199441664} | |
| {"current_steps": 535, "total_steps": 3099, "loss": 0.0851, "lr": 4.9208404274793615e-05, "epoch": 0.5179716809875348, "percentage": 17.26, "elapsed_time": "15:45:24", "remaining_time": "3 days, 3:30:53", "throughput": 3550.42, "total_tokens": 201395760} | |
| {"current_steps": 540, "total_steps": 3099, "loss": 0.0859, "lr": 4.917286910004402e-05, "epoch": 0.522812537819194, "percentage": 17.42, "elapsed_time": "15:50:47", "remaining_time": "3 days, 3:05:42", "throughput": 3563.5, "total_tokens": 203289168} | |
| {"current_steps": 545, "total_steps": 3099, "loss": 0.0932, "lr": 4.9136567147057886e-05, "epoch": 0.5276533946508531, "percentage": 17.59, "elapsed_time": "15:55:19", "remaining_time": "3 days, 2:36:54", "throughput": 3577.94, "total_tokens": 205086960} | |
| {"current_steps": 550, "total_steps": 3099, "loss": 0.0877, "lr": 4.9099499567355465e-05, "epoch": 0.5324942514825124, "percentage": 17.75, "elapsed_time": "16:01:16", "remaining_time": "3 days, 2:15:02", "throughput": 3589.68, "total_tokens": 207038560} | |
| {"current_steps": 555, "total_steps": 3099, "loss": 0.0849, "lr": 4.9061667536743096e-05, "epoch": 0.5373351083141716, "percentage": 17.91, "elapsed_time": "16:06:56", "remaining_time": "3 days, 1:52:15", "throughput": 3602.33, "total_tokens": 208994656} | |
| {"current_steps": 560, "total_steps": 3099, "loss": 0.0924, "lr": 4.9023072255276e-05, "epoch": 0.5421759651458308, "percentage": 18.07, "elapsed_time": "16:12:35", "remaining_time": "3 days, 1:29:37", "throughput": 3613.41, "total_tokens": 210860592} | |
| {"current_steps": 565, "total_steps": 3099, "loss": 0.0852, "lr": 4.89837149472202e-05, "epoch": 0.54701682197749, "percentage": 18.23, "elapsed_time": "16:18:46", "remaining_time": "3 days, 1:09:45", "throughput": 3623.96, "total_tokens": 212822400} | |
| {"current_steps": 570, "total_steps": 3099, "loss": 0.0894, "lr": 4.894359686101363e-05, "epoch": 0.5518576788091493, "percentage": 18.39, "elapsed_time": "16:24:41", "remaining_time": "3 days, 0:48:54", "throughput": 3634.82, "total_tokens": 214750096} | |
| {"current_steps": 575, "total_steps": 3099, "loss": 0.0859, "lr": 4.890271926922661e-05, "epoch": 0.5566985356408084, "percentage": 18.55, "elapsed_time": "16:31:06", "remaining_time": "3 days, 0:30:34", "throughput": 3644.78, "total_tokens": 216744256} | |
| {"current_steps": 580, "total_steps": 3099, "loss": 0.0843, "lr": 4.886108346852142e-05, "epoch": 0.5615393924724676, "percentage": 18.72, "elapsed_time": "16:35:59", "remaining_time": "3 days, 0:05:42", "throughput": 3658.29, "total_tokens": 218618416} | |
| {"current_steps": 585, "total_steps": 3099, "loss": 0.0881, "lr": 4.881869077961119e-05, "epoch": 0.5663802493041268, "percentage": 18.88, "elapsed_time": "16:41:11", "remaining_time": "2 days, 23:42:33", "throughput": 3670.18, "total_tokens": 220473312} | |
| {"current_steps": 590, "total_steps": 3099, "loss": 0.0838, "lr": 4.8775542547218035e-05, "epoch": 0.571221106135786, "percentage": 19.04, "elapsed_time": "16:47:11", "remaining_time": "2 days, 23:23:09", "throughput": 3680.74, "total_tokens": 222434400} | |
| {"current_steps": 595, "total_steps": 3099, "loss": 0.0823, "lr": 4.873164014003035e-05, "epoch": 0.5760619629674453, "percentage": 19.2, "elapsed_time": "16:52:41", "remaining_time": "2 days, 23:01:47", "throughput": 3692.24, "total_tokens": 224344864} | |
| {"current_steps": 600, "total_steps": 3099, "loss": 0.0908, "lr": 4.868698495065942e-05, "epoch": 0.5809028197991044, "percentage": 19.36, "elapsed_time": "16:59:32", "remaining_time": "2 days, 22:46:23", "throughput": 3699.79, "total_tokens": 226325424} | |
| {"current_steps": 605, "total_steps": 3099, "loss": 0.0841, "lr": 4.8641578395595244e-05, "epoch": 0.5857436766307637, "percentage": 19.52, "elapsed_time": "17:04:31", "remaining_time": "2 days, 22:23:26", "throughput": 3712.65, "total_tokens": 228223680} | |
| {"current_steps": 610, "total_steps": 3099, "loss": 0.09, "lr": 4.8595421915161606e-05, "epoch": 0.5905845334624229, "percentage": 19.68, "elapsed_time": "17:09:32", "remaining_time": "2 days, 22:00:53", "throughput": 3724.15, "total_tokens": 230051616} | |
| {"current_steps": 615, "total_steps": 3099, "loss": 0.0953, "lr": 4.854851697347038e-05, "epoch": 0.595425390294082, "percentage": 19.85, "elapsed_time": "17:13:36", "remaining_time": "2 days, 21:34:47", "throughput": 3737.44, "total_tokens": 231784640} | |
| {"current_steps": 620, "total_steps": 3099, "loss": 0.0818, "lr": 4.8500865058375084e-05, "epoch": 0.6002662471257413, "percentage": 20.01, "elapsed_time": "17:18:20", "remaining_time": "2 days, 21:11:41", "throughput": 3749.97, "total_tokens": 233624880} | |
| {"current_steps": 625, "total_steps": 3099, "loss": 0.0919, "lr": 4.845246768142371e-05, "epoch": 0.6051071039574004, "percentage": 20.17, "elapsed_time": "17:24:03", "remaining_time": "2 days, 20:52:48", "throughput": 3760.64, "total_tokens": 235580064} | |
| {"current_steps": 630, "total_steps": 3099, "loss": 0.0806, "lr": 4.840332637781072e-05, "epoch": 0.6099479607890597, "percentage": 20.33, "elapsed_time": "17:30:13", "remaining_time": "2 days, 20:35:51", "throughput": 3770.31, "total_tokens": 237579456} | |
| {"current_steps": 635, "total_steps": 3099, "loss": 0.0894, "lr": 4.835344270632844e-05, "epoch": 0.6147888176207189, "percentage": 20.49, "elapsed_time": "17:35:06", "remaining_time": "2 days, 20:14:08", "throughput": 3781.3, "total_tokens": 239379872} | |
| {"current_steps": 640, "total_steps": 3099, "loss": 0.0917, "lr": 4.830281824931751e-05, "epoch": 0.619629674452378, "percentage": 20.65, "elapsed_time": "17:41:00", "remaining_time": "2 days, 19:56:34", "throughput": 3791.13, "total_tokens": 241343936} | |
| {"current_steps": 645, "total_steps": 3099, "loss": 0.0949, "lr": 4.825145461261677e-05, "epoch": 0.6244705312840373, "percentage": 20.81, "elapsed_time": "17:45:56", "remaining_time": "2 days, 19:35:31", "throughput": 3801.45, "total_tokens": 243126480} | |
| {"current_steps": 650, "total_steps": 3099, "loss": 0.0836, "lr": 4.8199353425512276e-05, "epoch": 0.6293113881156964, "percentage": 20.97, "elapsed_time": "17:51:22", "remaining_time": "2 days, 19:16:35", "throughput": 3811.88, "total_tokens": 245036080} | |
| {"current_steps": 655, "total_steps": 3099, "loss": 0.0919, "lr": 4.814651634068565e-05, "epoch": 0.6341522449473557, "percentage": 21.14, "elapsed_time": "17:55:54", "remaining_time": "2 days, 18:54:31", "throughput": 3823.7, "total_tokens": 246836544} | |
| {"current_steps": 660, "total_steps": 3099, "loss": 0.0885, "lr": 4.809294503416164e-05, "epoch": 0.6389931017790149, "percentage": 21.3, "elapsed_time": "18:01:01", "remaining_time": "2 days, 18:34:52", "throughput": 3834.56, "total_tokens": 248715200} | |
| {"current_steps": 665, "total_steps": 3099, "loss": 0.0845, "lr": 4.8038641205254945e-05, "epoch": 0.643833958610674, "percentage": 21.46, "elapsed_time": "18:06:01", "remaining_time": "2 days, 18:15:01", "throughput": 3845.58, "total_tokens": 250584112} | |
| {"current_steps": 670, "total_steps": 3099, "loss": 0.0834, "lr": 4.7983606576516335e-05, "epoch": 0.6486748154423333, "percentage": 21.62, "elapsed_time": "18:10:46", "remaining_time": "2 days, 17:54:29", "throughput": 3857.27, "total_tokens": 252446000} | |
| {"current_steps": 675, "total_steps": 3099, "loss": 0.0889, "lr": 4.792784289367799e-05, "epoch": 0.6535156722739925, "percentage": 21.78, "elapsed_time": "18:16:46", "remaining_time": "2 days, 17:38:40", "throughput": 3864.89, "total_tokens": 254336512} | |
| {"current_steps": 680, "total_steps": 3099, "loss": 0.081, "lr": 4.787135192559814e-05, "epoch": 0.6583565291056517, "percentage": 21.94, "elapsed_time": "18:21:57", "remaining_time": "2 days, 17:20:03", "throughput": 3875.64, "total_tokens": 256248240} | |
| {"current_steps": 685, "total_steps": 3099, "loss": 0.0925, "lr": 4.781413546420494e-05, "epoch": 0.6631973859373109, "percentage": 22.1, "elapsed_time": "18:26:36", "remaining_time": "2 days, 16:59:47", "throughput": 3886.02, "total_tokens": 258018928} | |
| {"current_steps": 690, "total_steps": 3099, "loss": 0.081, "lr": 4.775619532443965e-05, "epoch": 0.6680382427689701, "percentage": 22.27, "elapsed_time": "18:33:01", "remaining_time": "2 days, 16:45:53", "throughput": 3893.92, "total_tokens": 260040928} | |
| {"current_steps": 695, "total_steps": 3099, "loss": 0.081, "lr": 4.7697533344199054e-05, "epoch": 0.6728790996006293, "percentage": 22.43, "elapsed_time": "18:38:31", "remaining_time": "2 days, 16:28:59", "throughput": 3903.73, "total_tokens": 261986240} | |
| {"current_steps": 700, "total_steps": 3099, "loss": 0.0834, "lr": 4.763815138427713e-05, "epoch": 0.6777199564322886, "percentage": 22.59, "elapsed_time": "18:43:09", "remaining_time": "2 days, 16:09:12", "throughput": 3914.7, "total_tokens": 263808880} | |
| {"current_steps": 705, "total_steps": 3099, "loss": 0.0858, "lr": 4.757805132830609e-05, "epoch": 0.6825608132639477, "percentage": 22.75, "elapsed_time": "18:48:13", "remaining_time": "2 days, 15:51:10", "throughput": 3924.47, "total_tokens": 265662032} | |
| {"current_steps": 710, "total_steps": 3099, "loss": 0.084, "lr": 4.751723508269659e-05, "epoch": 0.6874016700956069, "percentage": 22.91, "elapsed_time": "18:53:44", "remaining_time": "2 days, 15:34:48", "throughput": 3932.42, "total_tokens": 267501344} | |
| {"current_steps": 715, "total_steps": 3099, "loss": 0.0843, "lr": 4.745570457657722e-05, "epoch": 0.6922425269272662, "percentage": 23.07, "elapsed_time": "18:59:03", "remaining_time": "2 days, 15:17:53", "throughput": 3941.79, "total_tokens": 269394176} | |
| {"current_steps": 720, "total_steps": 3099, "loss": 0.0911, "lr": 4.7393461761733395e-05, "epoch": 0.6970833837589253, "percentage": 23.23, "elapsed_time": "19:05:05", "remaining_time": "2 days, 15:03:32", "throughput": 3948.59, "total_tokens": 271288208} | |
| {"current_steps": 725, "total_steps": 3099, "loss": 0.0759, "lr": 4.733050861254538e-05, "epoch": 0.7019242405905846, "percentage": 23.39, "elapsed_time": "19:10:04", "remaining_time": "2 days, 14:45:53", "throughput": 3958.45, "total_tokens": 273149952} | |
| {"current_steps": 730, "total_steps": 3099, "loss": 0.0874, "lr": 4.7266847125925686e-05, "epoch": 0.7067650974222437, "percentage": 23.56, "elapsed_time": "19:15:10", "remaining_time": "2 days, 14:28:45", "throughput": 3967.93, "total_tokens": 275017888} | |
| {"current_steps": 735, "total_steps": 3099, "loss": 0.0877, "lr": 4.720247932125572e-05, "epoch": 0.7116059542539029, "percentage": 23.72, "elapsed_time": "19:20:07", "remaining_time": "2 days, 14:11:19", "throughput": 3976.9, "total_tokens": 276821728} | |
| {"current_steps": 740, "total_steps": 3099, "loss": 0.0854, "lr": 4.713740724032173e-05, "epoch": 0.7164468110855622, "percentage": 23.88, "elapsed_time": "19:24:49", "remaining_time": "2 days, 13:53:16", "throughput": 3986.99, "total_tokens": 278648688} | |
| {"current_steps": 745, "total_steps": 3099, "loss": 0.0856, "lr": 4.7071632947250056e-05, "epoch": 0.7212876679172213, "percentage": 24.04, "elapsed_time": "19:30:20", "remaining_time": "2 days, 13:37:56", "throughput": 3995.63, "total_tokens": 280573744} | |
| {"current_steps": 750, "total_steps": 3099, "loss": 0.088, "lr": 4.700515852844161e-05, "epoch": 0.7261285247488806, "percentage": 24.2, "elapsed_time": "19:35:31", "remaining_time": "2 days, 13:21:45", "throughput": 4003.67, "total_tokens": 282386080} | |
| {"current_steps": 755, "total_steps": 3099, "loss": 0.0853, "lr": 4.6937986092505734e-05, "epoch": 0.7309693815805397, "percentage": 24.36, "elapsed_time": "19:39:36", "remaining_time": "2 days, 13:02:16", "throughput": 4014.93, "total_tokens": 284163392} | |
| {"current_steps": 760, "total_steps": 3099, "loss": 0.0897, "lr": 4.687011777019331e-05, "epoch": 0.735810238412199, "percentage": 24.52, "elapsed_time": "19:44:25", "remaining_time": "2 days, 12:45:12", "throughput": 4024.18, "total_tokens": 285979472} | |
| {"current_steps": 765, "total_steps": 3099, "loss": 0.0866, "lr": 4.680155571432915e-05, "epoch": 0.7406510952438582, "percentage": 24.69, "elapsed_time": "19:49:02", "remaining_time": "2 days, 12:27:43", "throughput": 4034.13, "total_tokens": 287803904} | |
| {"current_steps": 770, "total_steps": 3099, "loss": 0.084, "lr": 4.673230209974372e-05, "epoch": 0.7454919520755173, "percentage": 24.85, "elapsed_time": "19:54:51", "remaining_time": "2 days, 12:14:04", "throughput": 4041.89, "total_tokens": 289770544} | |
| {"current_steps": 775, "total_steps": 3099, "loss": 0.0847, "lr": 4.666235912320416e-05, "epoch": 0.7503328089071766, "percentage": 25.01, "elapsed_time": "19:59:51", "remaining_time": "2 days, 11:58:00", "throughput": 4051.05, "total_tokens": 291639680} | |
| {"current_steps": 780, "total_steps": 3099, "loss": 0.0855, "lr": 4.6591729003344604e-05, "epoch": 0.7551736657388358, "percentage": 25.17, "elapsed_time": "20:04:49", "remaining_time": "2 days, 11:42:01", "throughput": 4059.98, "total_tokens": 293493632} | |
| {"current_steps": 785, "total_steps": 3099, "loss": 0.0874, "lr": 4.652041398059577e-05, "epoch": 0.760014522570495, "percentage": 25.33, "elapsed_time": "20:10:13", "remaining_time": "2 days, 11:27:26", "throughput": 4068.37, "total_tokens": 295416672} | |
| {"current_steps": 790, "total_steps": 3099, "loss": 0.0917, "lr": 4.644841631711393e-05, "epoch": 0.7648553794021542, "percentage": 25.49, "elapsed_time": "20:14:58", "remaining_time": "2 days, 11:11:06", "throughput": 4077.33, "total_tokens": 297230848} | |
| {"current_steps": 795, "total_steps": 3099, "loss": 0.0862, "lr": 4.637573829670913e-05, "epoch": 0.7696962362338133, "percentage": 25.65, "elapsed_time": "20:21:20", "remaining_time": "2 days, 10:59:34", "throughput": 4083.23, "total_tokens": 299220432} | |
| {"current_steps": 800, "total_steps": 3099, "loss": 0.0876, "lr": 4.630238222477277e-05, "epoch": 0.7745370930654726, "percentage": 25.81, "elapsed_time": "20:26:39", "remaining_time": "2 days, 10:45:06", "throughput": 4091.12, "total_tokens": 301103984} | |
| {"current_steps": 805, "total_steps": 3099, "loss": 0.0832, "lr": 4.622835042820445e-05, "epoch": 0.7793779498971318, "percentage": 25.98, "elapsed_time": "20:31:42", "remaining_time": "2 days, 10:29:58", "throughput": 4100.06, "total_tokens": 303004240} | |
| {"current_steps": 810, "total_steps": 3099, "loss": 0.0875, "lr": 4.615364525533817e-05, "epoch": 0.784218806728791, "percentage": 26.14, "elapsed_time": "20:35:58", "remaining_time": "2 days, 10:12:45", "throughput": 4109.83, "total_tokens": 304776752} | |
| {"current_steps": 815, "total_steps": 3099, "loss": 0.0838, "lr": 4.6078269075867844e-05, "epoch": 0.7890596635604502, "percentage": 26.3, "elapsed_time": "20:40:43", "remaining_time": "2 days, 9:57:04", "throughput": 4118.09, "total_tokens": 306564704} | |
| {"current_steps": 820, "total_steps": 3099, "loss": 0.0831, "lr": 4.600222428077212e-05, "epoch": 0.7939005203921095, "percentage": 26.46, "elapsed_time": "20:46:16", "remaining_time": "2 days, 9:43:45", "throughput": 4124.85, "total_tokens": 308443424} | |
| {"current_steps": 825, "total_steps": 3099, "loss": 0.0861, "lr": 4.592551328223854e-05, "epoch": 0.7987413772237686, "percentage": 26.62, "elapsed_time": "20:51:14", "remaining_time": "2 days, 9:28:52", "throughput": 4133.59, "total_tokens": 310326496} | |
| {"current_steps": 830, "total_steps": 3099, "loss": 0.0868, "lr": 4.584813851358705e-05, "epoch": 0.8035822340554278, "percentage": 26.78, "elapsed_time": "20:58:15", "remaining_time": "2 days, 9:19:45", "throughput": 4136.99, "total_tokens": 312324656} | |
| {"current_steps": 835, "total_steps": 3099, "loss": 0.0823, "lr": 4.577010242919277e-05, "epoch": 0.808423090887087, "percentage": 26.94, "elapsed_time": "21:04:18", "remaining_time": "2 days, 9:08:00", "throughput": 4142.78, "total_tokens": 314264240} | |
| {"current_steps": 840, "total_steps": 3099, "loss": 0.0823, "lr": 4.569140750440817e-05, "epoch": 0.8132639477187462, "percentage": 27.11, "elapsed_time": "21:08:57", "remaining_time": "2 days, 8:52:35", "throughput": 4151.58, "total_tokens": 316091424} | |
| {"current_steps": 845, "total_steps": 3099, "loss": 0.0816, "lr": 4.561205623548453e-05, "epoch": 0.8181048045504055, "percentage": 27.27, "elapsed_time": "21:14:13", "remaining_time": "2 days, 8:38:56", "throughput": 4159.67, "total_tokens": 318022304} | |
| {"current_steps": 850, "total_steps": 3099, "loss": 0.0814, "lr": 4.5532051139492784e-05, "epoch": 0.8229456613820646, "percentage": 27.43, "elapsed_time": "21:19:41", "remaining_time": "2 days, 8:25:55", "throughput": 4166.21, "total_tokens": 319889920} | |
| {"current_steps": 855, "total_steps": 3099, "loss": 0.0855, "lr": 4.545139475424366e-05, "epoch": 0.8277865182137238, "percentage": 27.59, "elapsed_time": "21:25:37", "remaining_time": "2 days, 8:14:12", "throughput": 4171.82, "total_tokens": 321805040} | |
| {"current_steps": 860, "total_steps": 3099, "loss": 0.0859, "lr": 4.537008963820717e-05, "epoch": 0.832627375045383, "percentage": 27.75, "elapsed_time": "21:30:25", "remaining_time": "2 days, 7:59:37", "throughput": 4179.83, "total_tokens": 323627168} | |
| {"current_steps": 865, "total_steps": 3099, "loss": 0.0866, "lr": 4.5288138370431464e-05, "epoch": 0.8374682318770422, "percentage": 27.91, "elapsed_time": "21:35:13", "remaining_time": "2 days, 7:45:08", "throughput": 4187.82, "total_tokens": 325450784} | |
| {"current_steps": 870, "total_steps": 3099, "loss": 0.0794, "lr": 4.520554355046105e-05, "epoch": 0.8423090887087015, "percentage": 28.07, "elapsed_time": "21:40:21", "remaining_time": "2 days, 7:31:36", "throughput": 4195.41, "total_tokens": 327331824} | |
| {"current_steps": 875, "total_steps": 3099, "loss": 0.0853, "lr": 4.512230779825427e-05, "epoch": 0.8471499455403606, "percentage": 28.23, "elapsed_time": "21:44:53", "remaining_time": "2 days, 7:16:39", "throughput": 4204.26, "total_tokens": 329167072} | |
| {"current_steps": 880, "total_steps": 3099, "loss": 0.0862, "lr": 4.503843375410024e-05, "epoch": 0.8519908023720199, "percentage": 28.4, "elapsed_time": "21:49:48", "remaining_time": "2 days, 7:02:48", "throughput": 4211.95, "total_tokens": 331011792} | |
| {"current_steps": 885, "total_steps": 3099, "loss": 0.0862, "lr": 4.49539240785351e-05, "epoch": 0.8568316592036791, "percentage": 28.56, "elapsed_time": "21:53:59", "remaining_time": "2 days, 6:47:12", "throughput": 4220.72, "total_tokens": 332759152} | |
| {"current_steps": 890, "total_steps": 3099, "loss": 0.0854, "lr": 4.4868781452257604e-05, "epoch": 0.8616725160353382, "percentage": 28.72, "elapsed_time": "21:58:26", "remaining_time": "2 days, 6:32:25", "throughput": 4229.06, "total_tokens": 334548544} | |
| {"current_steps": 895, "total_steps": 3099, "loss": 0.081, "lr": 4.478300857604407e-05, "epoch": 0.8665133728669975, "percentage": 28.88, "elapsed_time": "22:04:07", "remaining_time": "2 days, 6:20:45", "throughput": 4235.25, "total_tokens": 336480736} | |
| {"current_steps": 900, "total_steps": 3099, "loss": 0.0799, "lr": 4.469660817066277e-05, "epoch": 0.8713542296986566, "percentage": 29.04, "elapsed_time": "22:09:48", "remaining_time": "2 days, 6:09:09", "throughput": 4241.55, "total_tokens": 338427280} | |
| {"current_steps": 905, "total_steps": 3099, "loss": 0.0828, "lr": 4.460958297678756e-05, "epoch": 0.8761950865303159, "percentage": 29.2, "elapsed_time": "22:15:40", "remaining_time": "2 days, 5:58:04", "throughput": 4246.94, "total_tokens": 340350320} | |
| {"current_steps": 910, "total_steps": 3099, "loss": 0.0815, "lr": 4.452193575491096e-05, "epoch": 0.8810359433619751, "percentage": 29.36, "elapsed_time": "22:20:47", "remaining_time": "2 days, 5:45:17", "throughput": 4254.01, "total_tokens": 342226288} | |
| {"current_steps": 915, "total_steps": 3099, "loss": 0.0813, "lr": 4.443366928525663e-05, "epoch": 0.8858768001936342, "percentage": 29.53, "elapsed_time": "22:26:43", "remaining_time": "2 days, 5:34:29", "throughput": 4259.74, "total_tokens": 344202544} | |
| {"current_steps": 920, "total_steps": 3099, "loss": 0.0889, "lr": 4.4344786367691125e-05, "epoch": 0.8907176570252935, "percentage": 29.69, "elapsed_time": "22:31:59", "remaining_time": "2 days, 5:22:10", "throughput": 4266.47, "total_tokens": 346094384} | |
| {"current_steps": 925, "total_steps": 3099, "loss": 0.0806, "lr": 4.425528982163512e-05, "epoch": 0.8955585138569527, "percentage": 29.85, "elapsed_time": "22:37:37", "remaining_time": "2 days, 5:10:47", "throughput": 4272.28, "total_tokens": 348009840} | |
| {"current_steps": 930, "total_steps": 3099, "loss": 0.0816, "lr": 4.416518248597395e-05, "epoch": 0.9003993706886119, "percentage": 30.01, "elapsed_time": "22:43:10", "remaining_time": "2 days, 4:59:16", "throughput": 4278.28, "total_tokens": 349923616} | |
| {"current_steps": 935, "total_steps": 3099, "loss": 0.0808, "lr": 4.4074467218967594e-05, "epoch": 0.9052402275202711, "percentage": 30.17, "elapsed_time": "22:50:23", "remaining_time": "2 days, 4:51:42", "throughput": 4280.78, "total_tokens": 351982800} | |
| {"current_steps": 940, "total_steps": 3099, "loss": 0.086, "lr": 4.398314689815995e-05, "epoch": 0.9100810843519302, "percentage": 30.33, "elapsed_time": "22:55:22", "remaining_time": "2 days, 4:38:58", "throughput": 4287.35, "total_tokens": 353803568} | |
| {"current_steps": 945, "total_steps": 3099, "loss": 0.0792, "lr": 4.389122442028762e-05, "epoch": 0.9149219411835895, "percentage": 30.49, "elapsed_time": "23:01:02", "remaining_time": "2 days, 4:27:53", "throughput": 4293.51, "total_tokens": 355770400} | |
| {"current_steps": 950, "total_steps": 3099, "loss": 0.0789, "lr": 4.379870270118801e-05, "epoch": 0.9197627980152487, "percentage": 30.66, "elapsed_time": "23:06:51", "remaining_time": "2 days, 4:17:12", "throughput": 4298.98, "total_tokens": 357722704} | |
| {"current_steps": 955, "total_steps": 3099, "loss": 0.0784, "lr": 4.370558467570678e-05, "epoch": 0.9246036548469079, "percentage": 30.82, "elapsed_time": "23:11:42", "remaining_time": "2 days, 4:04:24", "throughput": 4306.77, "total_tokens": 359625392} | |
| {"current_steps": 960, "total_steps": 3099, "loss": 0.0812, "lr": 4.361187329760483e-05, "epoch": 0.9294445116785671, "percentage": 30.98, "elapsed_time": "23:16:35", "remaining_time": "2 days, 3:51:47", "throughput": 4313.81, "total_tokens": 361478880} | |
| {"current_steps": 965, "total_steps": 3099, "loss": 0.0831, "lr": 4.351757153946456e-05, "epoch": 0.9342853685102263, "percentage": 31.14, "elapsed_time": "23:22:04", "remaining_time": "2 days, 3:40:32", "throughput": 4319.81, "total_tokens": 363401552} | |
| {"current_steps": 970, "total_steps": 3099, "loss": 0.077, "lr": 4.3422682392595594e-05, "epoch": 0.9391262253418855, "percentage": 31.3, "elapsed_time": "23:26:35", "remaining_time": "2 days, 3:27:15", "throughput": 4327.9, "total_tokens": 365256960} | |
| {"current_steps": 975, "total_steps": 3099, "loss": 0.0781, "lr": 4.332720886693987e-05, "epoch": 0.9439670821735447, "percentage": 31.46, "elapsed_time": "23:32:17", "remaining_time": "2 days, 3:16:36", "throughput": 4333.02, "total_tokens": 367167264} | |
| {"current_steps": 980, "total_steps": 3099, "loss": 0.084, "lr": 4.32311539909762e-05, "epoch": 0.9488079390052039, "percentage": 31.62, "elapsed_time": "23:38:26", "remaining_time": "2 days, 3:07:00", "throughput": 4335.47, "total_tokens": 368976208} | |
| {"current_steps": 985, "total_steps": 3099, "loss": 0.0829, "lr": 4.313452081162416e-05, "epoch": 0.9536487958368631, "percentage": 31.78, "elapsed_time": "23:52:16", "remaining_time": "2 days, 3:13:56", "throughput": 4315.54, "total_tokens": 370862208} | |
| {"current_steps": 990, "total_steps": 3099, "loss": 0.0859, "lr": 4.303731239414749e-05, "epoch": 0.9584896526685224, "percentage": 31.95, "elapsed_time": "1 day, 0:05:38", "remaining_time": "2 days, 3:19:38", "throughput": 4297.06, "total_tokens": 372719648} | |
| {"current_steps": 995, "total_steps": 3099, "loss": 0.0869, "lr": 4.2939531822056815e-05, "epoch": 0.9633305095001815, "percentage": 32.11, "elapsed_time": "1 day, 0:19:18", "remaining_time": "2 days, 3:25:47", "throughput": 4278.59, "total_tokens": 374624944} | |
| {"current_steps": 1000, "total_steps": 3099, "loss": 0.0794, "lr": 4.284118219701187e-05, "epoch": 0.9681713663318408, "percentage": 32.27, "elapsed_time": "1 day, 0:32:03", "remaining_time": "2 days, 3:29:50", "throughput": 4263.05, "total_tokens": 376525888} | |
| {"current_steps": 1005, "total_steps": 3099, "loss": 0.0804, "lr": 4.2742266638723096e-05, "epoch": 0.9730122231634999, "percentage": 32.43, "elapsed_time": "1 day, 0:47:25", "remaining_time": "2 days, 3:39:09", "throughput": 4241.55, "total_tokens": 378537840} | |
| {"current_steps": 1010, "total_steps": 3099, "loss": 0.0845, "lr": 4.264278828485267e-05, "epoch": 0.9778530799951591, "percentage": 32.59, "elapsed_time": "1 day, 1:01:19", "remaining_time": "2 days, 3:45:13", "throughput": 4222.9, "total_tokens": 380397552} | |
| {"current_steps": 1015, "total_steps": 3099, "loss": 0.089, "lr": 4.254275029091501e-05, "epoch": 0.9826939368268184, "percentage": 32.75, "elapsed_time": "1 day, 1:15:22", "remaining_time": "2 days, 3:51:23", "throughput": 4203.46, "total_tokens": 382191440} | |
| {"current_steps": 1020, "total_steps": 3099, "loss": 0.0887, "lr": 4.2442155830176655e-05, "epoch": 0.9875347936584775, "percentage": 32.91, "elapsed_time": "1 day, 1:29:13", "remaining_time": "2 days, 3:56:55", "throughput": 4185.73, "total_tokens": 384056752} | |
| {"current_steps": 1025, "total_steps": 3099, "loss": 0.0833, "lr": 4.2341008093555604e-05, "epoch": 0.9923756504901368, "percentage": 33.08, "elapsed_time": "1 day, 1:43:22", "remaining_time": "2 days, 4:02:53", "throughput": 4168.07, "total_tokens": 385974032} | |
| {"current_steps": 1030, "total_steps": 3099, "loss": 0.0807, "lr": 4.22393102895201e-05, "epoch": 0.997216507321796, "percentage": 33.24, "elapsed_time": "1 day, 1:57:06", "remaining_time": "2 days, 4:07:49", "throughput": 4151.76, "total_tokens": 387884720} | |
| {"current_steps": 1035, "total_steps": 3099, "loss": 0.0727, "lr": 4.213706564398688e-05, "epoch": 1.0019363427326637, "percentage": 33.4, "elapsed_time": "1 day, 2:10:54", "remaining_time": "2 days, 4:12:43", "throughput": 4134.38, "total_tokens": 389685952} | |
| {"current_steps": 1040, "total_steps": 3099, "loss": 0.0713, "lr": 4.203427740021884e-05, "epoch": 1.0067771995643229, "percentage": 33.56, "elapsed_time": "1 day, 2:26:08", "remaining_time": "2 days, 4:20:15", "throughput": 4115.06, "total_tokens": 391624192} | |
| {"current_steps": 1045, "total_steps": 3099, "loss": 0.0671, "lr": 4.1930948818722104e-05, "epoch": 1.011618056395982, "percentage": 33.72, "elapsed_time": "1 day, 2:42:31", "remaining_time": "2 days, 4:29:49", "throughput": 4094.19, "total_tokens": 393660384} | |
| {"current_steps": 1050, "total_steps": 3099, "loss": 0.0686, "lr": 4.182708317714267e-05, "epoch": 1.0164589132276414, "percentage": 33.88, "elapsed_time": "1 day, 2:56:00", "remaining_time": "2 days, 4:33:30", "throughput": 4079.29, "total_tokens": 395529008} | |
| {"current_steps": 1055, "total_steps": 3099, "loss": 0.0684, "lr": 4.172268377016241e-05, "epoch": 1.0212997700593005, "percentage": 34.04, "elapsed_time": "1 day, 3:08:31", "remaining_time": "2 days, 4:35:11", "throughput": 4066.52, "total_tokens": 397347360} | |
| {"current_steps": 1060, "total_steps": 3099, "loss": 0.0664, "lr": 4.161775390939454e-05, "epoch": 1.0261406268909596, "percentage": 34.2, "elapsed_time": "1 day, 3:23:35", "remaining_time": "2 days, 4:41:35", "throughput": 4049.01, "total_tokens": 399294608} | |
| {"current_steps": 1065, "total_steps": 3099, "loss": 0.0657, "lr": 4.151229692327863e-05, "epoch": 1.030981483722619, "percentage": 34.37, "elapsed_time": "1 day, 3:38:44", "remaining_time": "2 days, 4:47:58", "throughput": 4031.48, "total_tokens": 401232320} | |
| {"current_steps": 1070, "total_steps": 3099, "loss": 0.0668, "lr": 4.1406316156974965e-05, "epoch": 1.0358223405542781, "percentage": 34.53, "elapsed_time": "1 day, 3:54:51", "remaining_time": "2 days, 4:55:58", "throughput": 4011.85, "total_tokens": 403156576} | |
| {"current_steps": 1075, "total_steps": 3099, "loss": 0.0685, "lr": 4.1299814972258466e-05, "epoch": 1.0406631973859373, "percentage": 34.69, "elapsed_time": "1 day, 4:07:07", "remaining_time": "2 days, 4:56:29", "throughput": 4000.65, "total_tokens": 404973808} | |
| {"current_steps": 1080, "total_steps": 3099, "loss": 0.0739, "lr": 4.1192796747412046e-05, "epoch": 1.0455040542175964, "percentage": 34.85, "elapsed_time": "1 day, 4:21:08", "remaining_time": "2 days, 5:00:12", "throughput": 3986.1, "total_tokens": 406856480} | |
| {"current_steps": 1085, "total_steps": 3099, "loss": 0.0743, "lr": 4.108526487711944e-05, "epoch": 1.0503449110492558, "percentage": 35.01, "elapsed_time": "1 day, 4:35:04", "remaining_time": "2 days, 5:03:33", "throughput": 3971.24, "total_tokens": 408659088} | |
| {"current_steps": 1090, "total_steps": 3099, "loss": 0.0674, "lr": 4.0977222772357545e-05, "epoch": 1.055185767880915, "percentage": 35.17, "elapsed_time": "1 day, 4:48:13", "remaining_time": "2 days, 5:05:20", "throughput": 3959.09, "total_tokens": 410533120} | |
| {"current_steps": 1095, "total_steps": 3099, "loss": 0.0723, "lr": 4.0868673860288196e-05, "epoch": 1.060026624712574, "percentage": 35.33, "elapsed_time": "1 day, 5:01:23", "remaining_time": "2 days, 5:06:58", "throughput": 3946.84, "total_tokens": 412377808} | |
| {"current_steps": 1100, "total_steps": 3099, "loss": 0.0659, "lr": 4.075962158414948e-05, "epoch": 1.0648674815442334, "percentage": 35.5, "elapsed_time": "1 day, 5:17:59", "remaining_time": "2 days, 5:14:45", "throughput": 3928.62, "total_tokens": 414390304} | |
| {"current_steps": 1105, "total_steps": 3099, "loss": 0.0671, "lr": 4.0650069403146484e-05, "epoch": 1.0697083383758925, "percentage": 35.66, "elapsed_time": "1 day, 5:35:09", "remaining_time": "2 days, 5:23:19", "throughput": 3909.63, "total_tokens": 416413616} | |
| {"current_steps": 1110, "total_steps": 3099, "loss": 0.0723, "lr": 4.0540020792341605e-05, "epoch": 1.0745491952075517, "percentage": 35.82, "elapsed_time": "1 day, 5:49:43", "remaining_time": "2 days, 5:27:00", "throughput": 3895.06, "total_tokens": 418267408} | |
| {"current_steps": 1115, "total_steps": 3099, "loss": 0.0676, "lr": 4.0429479242544285e-05, "epoch": 1.079390052039211, "percentage": 35.98, "elapsed_time": "1 day, 6:02:58", "remaining_time": "2 days, 5:28:10", "throughput": 3883.58, "total_tokens": 420122000} | |
| {"current_steps": 1120, "total_steps": 3099, "loss": 0.0673, "lr": 4.031844826020028e-05, "epoch": 1.0842309088708701, "percentage": 36.14, "elapsed_time": "1 day, 6:16:24", "remaining_time": "2 days, 5:29:30", "throughput": 3871.94, "total_tokens": 421979504} | |
| {"current_steps": 1125, "total_steps": 3099, "loss": 0.0716, "lr": 4.020693136728047e-05, "epoch": 1.0890717657025293, "percentage": 36.3, "elapsed_time": "1 day, 6:30:48", "remaining_time": "2 days, 5:32:28", "throughput": 3858.5, "total_tokens": 423852128} | |
| {"current_steps": 1130, "total_steps": 3099, "loss": 0.066, "lr": 4.0094932101169116e-05, "epoch": 1.0939126225341886, "percentage": 36.46, "elapsed_time": "1 day, 6:47:09", "remaining_time": "2 days, 5:38:37", "throughput": 3842.54, "total_tokens": 425865744} | |
| {"current_steps": 1135, "total_steps": 3099, "loss": 0.0671, "lr": 3.9982454014551626e-05, "epoch": 1.0987534793658478, "percentage": 36.62, "elapsed_time": "1 day, 7:01:17", "remaining_time": "2 days, 5:40:46", "throughput": 3830.89, "total_tokens": 427825520} | |
| {"current_steps": 1140, "total_steps": 3099, "loss": 0.0659, "lr": 3.9869500675301925e-05, "epoch": 1.103594336197507, "percentage": 36.79, "elapsed_time": "1 day, 7:14:12", "remaining_time": "2 days, 5:40:40", "throughput": 3820.74, "total_tokens": 429650464} | |
| {"current_steps": 1145, "total_steps": 3099, "loss": 0.0674, "lr": 3.975607566636921e-05, "epoch": 1.1084351930291663, "percentage": 36.95, "elapsed_time": "1 day, 7:28:19", "remaining_time": "2 days, 5:42:32", "throughput": 3809.01, "total_tokens": 431560992} | |
| {"current_steps": 1150, "total_steps": 3099, "loss": 0.0679, "lr": 3.964218258566436e-05, "epoch": 1.1132760498608254, "percentage": 37.11, "elapsed_time": "1 day, 7:42:00", "remaining_time": "2 days, 5:43:29", "throughput": 3798.19, "total_tokens": 433452176} | |
| {"current_steps": 1155, "total_steps": 3099, "loss": 0.0683, "lr": 3.952782504594574e-05, "epoch": 1.1181169066924845, "percentage": 37.27, "elapsed_time": "1 day, 7:55:32", "remaining_time": "2 days, 5:44:03", "throughput": 3788.08, "total_tokens": 435371936} | |
| {"current_steps": 1160, "total_steps": 3099, "loss": 0.0696, "lr": 3.9413006674704684e-05, "epoch": 1.1229577635241437, "percentage": 37.43, "elapsed_time": "1 day, 8:08:43", "remaining_time": "2 days, 5:43:57", "throughput": 3777.9, "total_tokens": 437191424} | |
| {"current_steps": 1165, "total_steps": 3099, "loss": 0.0693, "lr": 3.929773111405034e-05, "epoch": 1.127798620355803, "percentage": 37.59, "elapsed_time": "1 day, 8:22:32", "remaining_time": "2 days, 5:44:47", "throughput": 3766.92, "total_tokens": 439045440} | |
| {"current_steps": 1170, "total_steps": 3099, "loss": 0.0705, "lr": 3.9182002020594235e-05, "epoch": 1.1326394771874622, "percentage": 37.75, "elapsed_time": "1 day, 8:37:41", "remaining_time": "2 days, 5:47:41", "throughput": 3753.99, "total_tokens": 440950928} | |
| {"current_steps": 1175, "total_steps": 3099, "loss": 0.0638, "lr": 3.906582306533418e-05, "epoch": 1.1374803340191213, "percentage": 37.92, "elapsed_time": "1 day, 8:54:14", "remaining_time": "2 days, 5:52:43", "throughput": 3739.1, "total_tokens": 442914960} | |
| {"current_steps": 1180, "total_steps": 3099, "loss": 0.0689, "lr": 3.8949197933537916e-05, "epoch": 1.1423211908507807, "percentage": 38.08, "elapsed_time": "1 day, 9:08:57", "remaining_time": "2 days, 5:54:34", "throughput": 3727.52, "total_tokens": 444832176} | |
| {"current_steps": 1185, "total_steps": 3099, "loss": 0.0682, "lr": 3.883213032462617e-05, "epoch": 1.1471620476824398, "percentage": 38.24, "elapsed_time": "1 day, 9:24:13", "remaining_time": "2 days, 5:57:12", "throughput": 3715.31, "total_tokens": 446780448} | |
| {"current_steps": 1190, "total_steps": 3099, "loss": 0.071, "lr": 3.871462395205531e-05, "epoch": 1.152002904514099, "percentage": 38.4, "elapsed_time": "1 day, 9:36:43", "remaining_time": "2 days, 5:55:13", "throughput": 3706.92, "total_tokens": 448550288} | |
| {"current_steps": 1195, "total_steps": 3099, "loss": 0.068, "lr": 3.8596682543199546e-05, "epoch": 1.1568437613457583, "percentage": 38.56, "elapsed_time": "1 day, 9:50:45", "remaining_time": "2 days, 5:55:36", "throughput": 3696.92, "total_tokens": 450450928} | |
| {"current_steps": 1200, "total_steps": 3099, "loss": 0.0687, "lr": 3.847830983923273e-05, "epoch": 1.1616846181774174, "percentage": 38.72, "elapsed_time": "1 day, 10:07:44", "remaining_time": "2 days, 6:00:33", "throughput": 3682.25, "total_tokens": 452419728} | |
| {"current_steps": 1205, "total_steps": 3099, "loss": 0.0719, "lr": 3.835950959500963e-05, "epoch": 1.1665254750090766, "percentage": 38.88, "elapsed_time": "1 day, 10:21:16", "remaining_time": "2 days, 5:59:52", "throughput": 3672.97, "total_tokens": 454259472} | |
| {"current_steps": 1210, "total_steps": 3099, "loss": 0.069, "lr": 3.8240285578946904e-05, "epoch": 1.1713663318407357, "percentage": 39.04, "elapsed_time": "1 day, 10:37:07", "remaining_time": "2 days, 6:02:42", "throughput": 3660.24, "total_tokens": 456165264} | |
| {"current_steps": 1215, "total_steps": 3099, "loss": 0.0666, "lr": 3.812064157290345e-05, "epoch": 1.176207188672395, "percentage": 39.21, "elapsed_time": "1 day, 10:51:09", "remaining_time": "2 days, 6:02:35", "throughput": 3650.65, "total_tokens": 458044704} | |
| {"current_steps": 1220, "total_steps": 3099, "loss": 0.0666, "lr": 3.800058137206053e-05, "epoch": 1.1810480455040542, "percentage": 39.37, "elapsed_time": "1 day, 11:05:28", "remaining_time": "2 days, 6:02:46", "throughput": 3640.63, "total_tokens": 459916000} | |
| {"current_steps": 1225, "total_steps": 3099, "loss": 0.0721, "lr": 3.788010878480139e-05, "epoch": 1.1858889023357135, "percentage": 39.53, "elapsed_time": "1 day, 11:20:50", "remaining_time": "2 days, 6:04:27", "throughput": 3628.95, "total_tokens": 461786304} | |
| {"current_steps": 1230, "total_steps": 3099, "loss": 0.0661, "lr": 3.775922763259038e-05, "epoch": 1.1907297591673727, "percentage": 39.69, "elapsed_time": "1 day, 11:36:00", "remaining_time": "2 days, 6:05:41", "throughput": 3617.93, "total_tokens": 463676192} | |
| {"current_steps": 1235, "total_steps": 3099, "loss": 0.0705, "lr": 3.763794174985181e-05, "epoch": 1.1955706159990318, "percentage": 39.85, "elapsed_time": "1 day, 11:50:02", "remaining_time": "2 days, 6:05:04", "throughput": 3609.26, "total_tokens": 465602880} | |
| {"current_steps": 1240, "total_steps": 3099, "loss": 0.0698, "lr": 3.7516254983848277e-05, "epoch": 1.200411472830691, "percentage": 40.01, "elapsed_time": "1 day, 12:02:23", "remaining_time": "2 days, 6:01:50", "throughput": 3603.22, "total_tokens": 467493856} | |
| {"current_steps": 1245, "total_steps": 3099, "loss": 0.0693, "lr": 3.7394171194558646e-05, "epoch": 1.2052523296623503, "percentage": 40.17, "elapsed_time": "1 day, 12:14:19", "remaining_time": "2 days, 5:57:54", "throughput": 3598.8, "total_tokens": 469496768} | |
| {"current_steps": 1250, "total_steps": 3099, "loss": 0.0693, "lr": 3.727169425455562e-05, "epoch": 1.2100931864940094, "percentage": 40.34, "elapsed_time": "1 day, 12:23:29", "remaining_time": "2 days, 5:49:49", "throughput": 3598.58, "total_tokens": 471449056} | |
| {"current_steps": 1255, "total_steps": 3099, "loss": 0.0697, "lr": 3.7148828048882857e-05, "epoch": 1.2149340433256686, "percentage": 40.5, "elapsed_time": "1 day, 12:33:25", "remaining_time": "2 days, 5:42:51", "throughput": 3596.08, "total_tokens": 473264848} | |
| {"current_steps": 1260, "total_steps": 3099, "loss": 0.069, "lr": 3.702557647493177e-05, "epoch": 1.219774900157328, "percentage": 40.66, "elapsed_time": "1 day, 12:41:46", "remaining_time": "2 days, 5:33:33", "throughput": 3596.67, "total_tokens": 475144208} | |
| {"current_steps": 1265, "total_steps": 3099, "loss": 0.0671, "lr": 3.690194344231789e-05, "epoch": 1.224615756988987, "percentage": 40.82, "elapsed_time": "1 day, 12:48:51", "remaining_time": "2 days, 5:22:24", "throughput": 3600.04, "total_tokens": 477118864} | |
| {"current_steps": 1270, "total_steps": 3099, "loss": 0.0697, "lr": 3.677793287275687e-05, "epoch": 1.2294566138206462, "percentage": 40.98, "elapsed_time": "1 day, 12:53:54", "remaining_time": "2 days, 5:08:22", "throughput": 3605.88, "total_tokens": 478984544} | |
| {"current_steps": 1275, "total_steps": 3099, "loss": 0.073, "lr": 3.665354869994003e-05, "epoch": 1.2342974706523056, "percentage": 41.14, "elapsed_time": "1 day, 12:59:10", "remaining_time": "2 days, 4:54:42", "throughput": 3611.43, "total_tokens": 480862384} | |
| {"current_steps": 1280, "total_steps": 3099, "loss": 0.071, "lr": 3.652879486940965e-05, "epoch": 1.2391383274839647, "percentage": 41.3, "elapsed_time": "1 day, 13:04:20", "remaining_time": "2 days, 4:40:59", "throughput": 3616.48, "total_tokens": 482657712} | |
| {"current_steps": 1285, "total_steps": 3099, "loss": 0.0694, "lr": 3.640367533843376e-05, "epoch": 1.2439791843156238, "percentage": 41.46, "elapsed_time": "1 day, 13:09:56", "remaining_time": "2 days, 4:27:57", "throughput": 3621.36, "total_tokens": 484527216} | |
| {"current_steps": 1290, "total_steps": 3099, "loss": 0.0664, "lr": 3.6278194075880625e-05, "epoch": 1.2488200411472832, "percentage": 41.63, "elapsed_time": "1 day, 13:14:57", "remaining_time": "2 days, 4:14:08", "throughput": 3627.39, "total_tokens": 486424320} | |
| {"current_steps": 1295, "total_steps": 3099, "loss": 0.0686, "lr": 3.615235506209288e-05, "epoch": 1.2536608979789423, "percentage": 41.79, "elapsed_time": "1 day, 13:21:12", "remaining_time": "2 days, 4:02:06", "throughput": 3632.39, "total_tokens": 488454832} | |
| {"current_steps": 1300, "total_steps": 3099, "loss": 0.0616, "lr": 3.602616228876123e-05, "epoch": 1.2585017548106014, "percentage": 41.95, "elapsed_time": "1 day, 13:26:41", "remaining_time": "2 days, 3:49:04", "throughput": 3638.0, "total_tokens": 490406800} | |
| {"current_steps": 1305, "total_steps": 3099, "loss": 0.0675, "lr": 3.589961975879787e-05, "epoch": 1.2633426116422606, "percentage": 42.11, "elapsed_time": "1 day, 13:32:09", "remaining_time": "2 days, 3:36:04", "throughput": 3643.32, "total_tokens": 492319664} | |
| {"current_steps": 1310, "total_steps": 3099, "loss": 0.0693, "lr": 3.577273148620946e-05, "epoch": 1.26818346847392, "percentage": 42.27, "elapsed_time": "1 day, 13:37:41", "remaining_time": "2 days, 3:23:12", "throughput": 3648.4, "total_tokens": 494216816} | |
| {"current_steps": 1315, "total_steps": 3099, "loss": 0.0699, "lr": 3.564550149596985e-05, "epoch": 1.273024325305579, "percentage": 42.43, "elapsed_time": "1 day, 13:42:50", "remaining_time": "2 days, 3:09:53", "throughput": 3653.56, "total_tokens": 496046624} | |
| {"current_steps": 1320, "total_steps": 3099, "loss": 0.0755, "lr": 3.5517933823892384e-05, "epoch": 1.2778651821372382, "percentage": 42.59, "elapsed_time": "1 day, 13:48:06", "remaining_time": "2 days, 2:56:47", "throughput": 3658.53, "total_tokens": 497876768} | |
| {"current_steps": 1325, "total_steps": 3099, "loss": 0.0786, "lr": 3.539003251650188e-05, "epoch": 1.2827060389688976, "percentage": 42.76, "elapsed_time": "1 day, 13:53:28", "remaining_time": "2 days, 2:43:53", "throughput": 3663.25, "total_tokens": 499699664} | |
| {"current_steps": 1330, "total_steps": 3099, "loss": 0.0683, "lr": 3.526180163090627e-05, "epoch": 1.2875468958005567, "percentage": 42.92, "elapsed_time": "1 day, 13:58:17", "remaining_time": "2 days, 2:30:18", "throughput": 3668.94, "total_tokens": 501536176} | |
| {"current_steps": 1335, "total_steps": 3099, "loss": 0.0688, "lr": 3.5133245234667883e-05, "epoch": 1.2923877526322158, "percentage": 43.08, "elapsed_time": "1 day, 14:03:22", "remaining_time": "2 days, 2:17:07", "throughput": 3674.17, "total_tokens": 503368832} | |
| {"current_steps": 1340, "total_steps": 3099, "loss": 0.0675, "lr": 3.50043674056745e-05, "epoch": 1.297228609463875, "percentage": 43.24, "elapsed_time": "1 day, 14:08:46", "remaining_time": "2 days, 2:04:26", "throughput": 3679.34, "total_tokens": 505269776} | |
| {"current_steps": 1345, "total_steps": 3099, "loss": 0.0646, "lr": 3.48751722320099e-05, "epoch": 1.3020694662955343, "percentage": 43.4, "elapsed_time": "1 day, 14:14:15", "remaining_time": "2 days, 1:51:54", "throughput": 3684.47, "total_tokens": 507187600} | |
| {"current_steps": 1350, "total_steps": 3099, "loss": 0.0701, "lr": 3.4745663811824234e-05, "epoch": 1.3069103231271935, "percentage": 43.56, "elapsed_time": "1 day, 14:18:52", "remaining_time": "2 days, 1:38:18", "throughput": 3690.23, "total_tokens": 509000368} | |
| {"current_steps": 1355, "total_steps": 3099, "loss": 0.0672, "lr": 3.461584625320407e-05, "epoch": 1.3117511799588528, "percentage": 43.72, "elapsed_time": "1 day, 14:23:30", "remaining_time": "2 days, 1:24:49", "throughput": 3695.89, "total_tokens": 510812240} | |
| {"current_steps": 1360, "total_steps": 3099, "loss": 0.0753, "lr": 3.448572367404197e-05, "epoch": 1.316592036790512, "percentage": 43.89, "elapsed_time": "1 day, 14:28:54", "remaining_time": "2 days, 1:12:20", "throughput": 3700.44, "total_tokens": 512638608} | |
| {"current_steps": 1365, "total_steps": 3099, "loss": 0.0666, "lr": 3.435530020190598e-05, "epoch": 1.321432893622171, "percentage": 44.05, "elapsed_time": "1 day, 14:33:25", "remaining_time": "2 days, 0:58:48", "throughput": 3706.34, "total_tokens": 514458464} | |
| {"current_steps": 1370, "total_steps": 3099, "loss": 0.0675, "lr": 3.422457997390865e-05, "epoch": 1.3262737504538302, "percentage": 44.21, "elapsed_time": "1 day, 14:37:59", "remaining_time": "2 days, 0:45:24", "throughput": 3712.13, "total_tokens": 516280880} | |
| {"current_steps": 1375, "total_steps": 3099, "loss": 0.0726, "lr": 3.4093567136575794e-05, "epoch": 1.3311146072854896, "percentage": 44.37, "elapsed_time": "1 day, 14:43:06", "remaining_time": "2 days, 0:32:45", "throughput": 3717.39, "total_tokens": 518154288} | |
| {"current_steps": 1380, "total_steps": 3099, "loss": 0.0747, "lr": 3.396226584571499e-05, "epoch": 1.3359554641171487, "percentage": 44.53, "elapsed_time": "1 day, 14:48:09", "remaining_time": "2 days, 0:20:04", "throughput": 3722.44, "total_tokens": 519986144} | |
| {"current_steps": 1385, "total_steps": 3099, "loss": 0.07, "lr": 3.383068026628371e-05, "epoch": 1.340796320948808, "percentage": 44.69, "elapsed_time": "1 day, 14:53:07", "remaining_time": "2 days, 0:07:20", "throughput": 3727.93, "total_tokens": 521862240} | |
| {"current_steps": 1390, "total_steps": 3099, "loss": 0.0665, "lr": 3.3698814572257284e-05, "epoch": 1.3456371777804672, "percentage": 44.85, "elapsed_time": "1 day, 14:58:57", "remaining_time": "1 day, 23:55:44", "throughput": 3732.85, "total_tokens": 523858656} | |
| {"current_steps": 1395, "total_steps": 3099, "loss": 0.0675, "lr": 3.356667294649639e-05, "epoch": 1.3504780346121263, "percentage": 45.01, "elapsed_time": "1 day, 15:04:30", "remaining_time": "1 day, 23:43:49", "throughput": 3737.63, "total_tokens": 525774560} | |
| {"current_steps": 1400, "total_steps": 3099, "loss": 0.0662, "lr": 3.343425958061447e-05, "epoch": 1.3553188914437855, "percentage": 45.18, "elapsed_time": "1 day, 15:09:54", "remaining_time": "1 day, 23:31:46", "throughput": 3742.58, "total_tokens": 527681344} | |
| {"current_steps": 1405, "total_steps": 3099, "loss": 0.0717, "lr": 3.330157867484472e-05, "epoch": 1.3601597482754448, "percentage": 45.34, "elapsed_time": "1 day, 15:13:55", "remaining_time": "1 day, 23:18:06", "throughput": 3748.4, "total_tokens": 529406736} | |
| {"current_steps": 1410, "total_steps": 3099, "loss": 0.0662, "lr": 3.3168634437906865e-05, "epoch": 1.365000605107104, "percentage": 45.5, "elapsed_time": "1 day, 15:19:06", "remaining_time": "1 day, 23:05:55", "throughput": 3753.57, "total_tokens": 531305872} | |
| {"current_steps": 1415, "total_steps": 3099, "loss": 0.0715, "lr": 3.303543108687364e-05, "epoch": 1.369841461938763, "percentage": 45.66, "elapsed_time": "1 day, 15:23:26", "remaining_time": "1 day, 22:52:44", "throughput": 3758.91, "total_tokens": 533037392} | |
| {"current_steps": 1420, "total_steps": 3099, "loss": 0.0687, "lr": 3.290197284703707e-05, "epoch": 1.3746823187704225, "percentage": 45.82, "elapsed_time": "1 day, 15:30:42", "remaining_time": "1 day, 22:43:07", "throughput": 3761.77, "total_tokens": 535085280} | |
| {"current_steps": 1425, "total_steps": 3099, "loss": 0.0728, "lr": 3.276826395177438e-05, "epoch": 1.3795231756020816, "percentage": 45.98, "elapsed_time": "1 day, 15:35:31", "remaining_time": "1 day, 22:30:36", "throughput": 3767.35, "total_tokens": 536966576} | |
| {"current_steps": 1430, "total_steps": 3099, "loss": 0.068, "lr": 3.263430864241376e-05, "epoch": 1.3843640324337407, "percentage": 46.14, "elapsed_time": "1 day, 15:40:54", "remaining_time": "1 day, 22:18:50", "throughput": 3771.87, "total_tokens": 538829216} | |
| {"current_steps": 1435, "total_steps": 3099, "loss": 0.0678, "lr": 3.250011116809978e-05, "epoch": 1.3892048892653999, "percentage": 46.31, "elapsed_time": "1 day, 15:46:01", "remaining_time": "1 day, 22:06:47", "throughput": 3776.39, "total_tokens": 540632144} | |
| {"current_steps": 1440, "total_steps": 3099, "loss": 0.0693, "lr": 3.236567578565867e-05, "epoch": 1.3940457460970592, "percentage": 46.47, "elapsed_time": "1 day, 15:50:20", "remaining_time": "1 day, 21:53:51", "throughput": 3782.12, "total_tokens": 542432288} | |
| {"current_steps": 1445, "total_steps": 3099, "loss": 0.0655, "lr": 3.223100675946321e-05, "epoch": 1.3988866029287184, "percentage": 46.63, "elapsed_time": "1 day, 15:56:48", "remaining_time": "1 day, 21:43:28", "throughput": 3785.61, "total_tokens": 544403440} | |
| {"current_steps": 1450, "total_steps": 3099, "loss": 0.0657, "lr": 3.209610836129755e-05, "epoch": 1.4037274597603777, "percentage": 46.79, "elapsed_time": "1 day, 16:00:56", "remaining_time": "1 day, 21:30:27", "throughput": 3791.51, "total_tokens": 546192304} | |
| {"current_steps": 1455, "total_steps": 3099, "loss": 0.065, "lr": 3.1960984870221596e-05, "epoch": 1.4085683165920369, "percentage": 46.95, "elapsed_time": "1 day, 16:05:34", "remaining_time": "1 day, 21:18:02", "throughput": 3796.96, "total_tokens": 548030912} | |
| {"current_steps": 1460, "total_steps": 3099, "loss": 0.067, "lr": 3.1825640572435394e-05, "epoch": 1.413409173423696, "percentage": 47.11, "elapsed_time": "1 day, 16:10:47", "remaining_time": "1 day, 21:06:21", "throughput": 3802.14, "total_tokens": 549968368} | |
| {"current_steps": 1465, "total_steps": 3099, "loss": 0.0633, "lr": 3.169007976114311e-05, "epoch": 1.4182500302553551, "percentage": 47.27, "elapsed_time": "1 day, 16:17:45", "remaining_time": "1 day, 20:56:40", "throughput": 3805.15, "total_tokens": 551997376} | |
| {"current_steps": 1470, "total_steps": 3099, "loss": 0.069, "lr": 3.155430673641681e-05, "epoch": 1.4230908870870145, "percentage": 47.43, "elapsed_time": "1 day, 16:22:30", "remaining_time": "1 day, 20:44:31", "throughput": 3810.22, "total_tokens": 553815552} | |
| {"current_steps": 1475, "total_steps": 3099, "loss": 0.0713, "lr": 3.1418325805060126e-05, "epoch": 1.4279317439186736, "percentage": 47.6, "elapsed_time": "1 day, 16:28:18", "remaining_time": "1 day, 20:33:36", "throughput": 3814.17, "total_tokens": 555719392} | |
| {"current_steps": 1480, "total_steps": 3099, "loss": 0.069, "lr": 3.1282141280471645e-05, "epoch": 1.4327726007503327, "percentage": 47.76, "elapsed_time": "1 day, 16:32:53", "remaining_time": "1 day, 20:21:23", "throughput": 3819.21, "total_tokens": 557504016} | |
| {"current_steps": 1485, "total_steps": 3099, "loss": 0.0678, "lr": 3.114575748250801e-05, "epoch": 1.437613457581992, "percentage": 47.92, "elapsed_time": "1 day, 16:38:47", "remaining_time": "1 day, 20:10:38", "throughput": 3823.29, "total_tokens": 559452496} | |
| {"current_steps": 1490, "total_steps": 3099, "loss": 0.0648, "lr": 3.100917873734696e-05, "epoch": 1.4424543144136512, "percentage": 48.08, "elapsed_time": "1 day, 16:44:15", "remaining_time": "1 day, 19:59:28", "throughput": 3827.59, "total_tokens": 561337136} | |
| {"current_steps": 1495, "total_steps": 3099, "loss": 0.0682, "lr": 3.087240937735008e-05, "epoch": 1.4472951712453104, "percentage": 48.24, "elapsed_time": "1 day, 16:49:12", "remaining_time": "1 day, 19:47:46", "throughput": 3832.78, "total_tokens": 563237008} | |
| {"current_steps": 1500, "total_steps": 3099, "loss": 0.07, "lr": 3.073545374092535e-05, "epoch": 1.4521360280769695, "percentage": 48.4, "elapsed_time": "1 day, 16:54:12", "remaining_time": "1 day, 19:36:10", "throughput": 3837.34, "total_tokens": 565056704} | |
| {"current_steps": 1505, "total_steps": 3099, "loss": 0.0653, "lr": 3.05983161723896e-05, "epoch": 1.4569768849086289, "percentage": 48.56, "elapsed_time": "1 day, 16:59:34", "remaining_time": "1 day, 19:25:01", "throughput": 3842.03, "total_tokens": 566984576} | |
| {"current_steps": 1510, "total_steps": 3099, "loss": 0.0664, "lr": 3.046100102183061e-05, "epoch": 1.461817741740288, "percentage": 48.73, "elapsed_time": "1 day, 17:04:49", "remaining_time": "1 day, 19:13:47", "throughput": 3847.0, "total_tokens": 568931872} | |
| {"current_steps": 1515, "total_steps": 3099, "loss": 0.0644, "lr": 3.0323512644969194e-05, "epoch": 1.4666585985719474, "percentage": 48.89, "elapsed_time": "1 day, 17:09:13", "remaining_time": "1 day, 19:01:40", "throughput": 3852.54, "total_tokens": 570766304} | |
| {"current_steps": 1520, "total_steps": 3099, "loss": 0.0697, "lr": 3.0185855403021013e-05, "epoch": 1.4714994554036065, "percentage": 49.05, "elapsed_time": "1 day, 17:14:49", "remaining_time": "1 day, 18:50:53", "throughput": 3856.78, "total_tokens": 572692384} | |
| {"current_steps": 1525, "total_steps": 3099, "loss": 0.0731, "lr": 3.0048033662558222e-05, "epoch": 1.4763403122352656, "percentage": 49.21, "elapsed_time": "1 day, 17:19:38", "remaining_time": "1 day, 18:39:18", "throughput": 3861.31, "total_tokens": 574478256} | |
| {"current_steps": 1530, "total_steps": 3099, "loss": 0.068, "lr": 2.9910051795370974e-05, "epoch": 1.4811811690669248, "percentage": 49.37, "elapsed_time": "1 day, 17:24:45", "remaining_time": "1 day, 18:28:05", "throughput": 3865.82, "total_tokens": 576337936} | |
| {"current_steps": 1535, "total_steps": 3099, "loss": 0.0663, "lr": 2.977191417832874e-05, "epoch": 1.4860220258985841, "percentage": 49.53, "elapsed_time": "1 day, 17:28:49", "remaining_time": "1 day, 18:15:51", "throughput": 3871.32, "total_tokens": 578104656} | |
| {"current_steps": 1540, "total_steps": 3099, "loss": 0.0674, "lr": 2.9633625193241475e-05, "epoch": 1.4908628827302433, "percentage": 49.69, "elapsed_time": "1 day, 17:33:40", "remaining_time": "1 day, 18:04:26", "throughput": 3876.17, "total_tokens": 579956016} | |
| {"current_steps": 1545, "total_steps": 3099, "loss": 0.0694, "lr": 2.9495189226720615e-05, "epoch": 1.4957037395619024, "percentage": 49.85, "elapsed_time": "1 day, 17:39:34", "remaining_time": "1 day, 17:54:08", "throughput": 3879.81, "total_tokens": 581873728} | |
| {"current_steps": 1550, "total_steps": 3099, "loss": 0.0689, "lr": 2.935661067003994e-05, "epoch": 1.5005445963935617, "percentage": 50.02, "elapsed_time": "1 day, 17:44:44", "remaining_time": "1 day, 17:43:07", "throughput": 3884.11, "total_tokens": 583722192} | |
| {"current_steps": 1555, "total_steps": 3099, "loss": 0.0711, "lr": 2.9217893918996285e-05, "epoch": 1.5053854532252209, "percentage": 50.18, "elapsed_time": "1 day, 17:49:34", "remaining_time": "1 day, 17:31:49", "throughput": 3888.65, "total_tokens": 585531280} | |
| {"current_steps": 1560, "total_steps": 3099, "loss": 0.0657, "lr": 2.9079043373770088e-05, "epoch": 1.51022631005688, "percentage": 50.34, "elapsed_time": "1 day, 17:55:16", "remaining_time": "1 day, 17:21:24", "throughput": 3892.66, "total_tokens": 587465120} | |
| {"current_steps": 1565, "total_steps": 3099, "loss": 0.065, "lr": 2.8940063438785808e-05, "epoch": 1.5150671668885392, "percentage": 50.5, "elapsed_time": "1 day, 18:00:32", "remaining_time": "1 day, 17:10:36", "throughput": 3896.73, "total_tokens": 589312272} | |
| {"current_steps": 1570, "total_steps": 3099, "loss": 0.0669, "lr": 2.8800958522572246e-05, "epoch": 1.5199080237201985, "percentage": 50.66, "elapsed_time": "1 day, 18:05:41", "remaining_time": "1 day, 16:59:44", "throughput": 3901.39, "total_tokens": 591224496} | |
| {"current_steps": 1575, "total_steps": 3099, "loss": 0.0703, "lr": 2.866173303762268e-05, "epoch": 1.5247488805518576, "percentage": 50.82, "elapsed_time": "1 day, 18:11:10", "remaining_time": "1 day, 16:49:12", "throughput": 3905.27, "total_tokens": 593094000} | |
| {"current_steps": 1580, "total_steps": 3099, "loss": 0.0678, "lr": 2.8522391400254887e-05, "epoch": 1.529589737383517, "percentage": 50.98, "elapsed_time": "1 day, 18:16:42", "remaining_time": "1 day, 16:38:45", "throughput": 3909.53, "total_tokens": 595038832} | |
| {"current_steps": 1585, "total_steps": 3099, "loss": 0.0697, "lr": 2.8382938030471112e-05, "epoch": 1.5344305942151761, "percentage": 51.15, "elapsed_time": "1 day, 18:20:52", "remaining_time": "1 day, 16:27:02", "throughput": 3914.84, "total_tokens": 596824960} | |
| {"current_steps": 1590, "total_steps": 3099, "loss": 0.0689, "lr": 2.8243377351817755e-05, "epoch": 1.5392714510468353, "percentage": 51.31, "elapsed_time": "1 day, 18:26:26", "remaining_time": "1 day, 16:16:43", "throughput": 3918.57, "total_tokens": 598705200} | |
| {"current_steps": 1595, "total_steps": 3099, "loss": 0.0612, "lr": 2.8103713791245178e-05, "epoch": 1.5441123078784944, "percentage": 51.47, "elapsed_time": "1 day, 18:31:34", "remaining_time": "1 day, 16:05:59", "throughput": 3923.07, "total_tokens": 600600592} | |
| {"current_steps": 1600, "total_steps": 3099, "loss": 0.0681, "lr": 2.7963951778967197e-05, "epoch": 1.5489531647101535, "percentage": 51.63, "elapsed_time": "1 day, 18:35:35", "remaining_time": "1 day, 15:54:16", "throughput": 3928.57, "total_tokens": 602389504} | |
| {"current_steps": 1605, "total_steps": 3099, "loss": 0.0697, "lr": 2.7824095748320568e-05, "epoch": 1.553794021541813, "percentage": 51.79, "elapsed_time": "1 day, 18:39:42", "remaining_time": "1 day, 15:42:40", "throughput": 3933.43, "total_tokens": 604104288} | |
| {"current_steps": 1610, "total_steps": 3099, "loss": 0.0701, "lr": 2.7684150135624376e-05, "epoch": 1.5586348783734723, "percentage": 51.95, "elapsed_time": "1 day, 18:44:40", "remaining_time": "1 day, 15:31:55", "throughput": 3937.81, "total_tokens": 605951504} | |
| {"current_steps": 1615, "total_steps": 3099, "loss": 0.0661, "lr": 2.7544119380039314e-05, "epoch": 1.5634757352051314, "percentage": 52.11, "elapsed_time": "1 day, 18:51:38", "remaining_time": "1 day, 15:23:02", "throughput": 3940.34, "total_tokens": 607990208} | |
| {"current_steps": 1620, "total_steps": 3099, "loss": 0.0699, "lr": 2.740400792342685e-05, "epoch": 1.5683165920367905, "percentage": 52.27, "elapsed_time": "1 day, 18:56:58", "remaining_time": "1 day, 15:12:41", "throughput": 3944.6, "total_tokens": 609909232} | |
| {"current_steps": 1625, "total_steps": 3099, "loss": 0.0718, "lr": 2.726382021020833e-05, "epoch": 1.5731574488684497, "percentage": 52.44, "elapsed_time": "1 day, 19:02:01", "remaining_time": "1 day, 15:02:05", "throughput": 3948.68, "total_tokens": 611736000} | |
| {"current_steps": 1630, "total_steps": 3099, "loss": 0.0665, "lr": 2.7123560687224013e-05, "epoch": 1.5779983057001088, "percentage": 52.6, "elapsed_time": "1 day, 19:06:47", "remaining_time": "1 day, 14:51:17", "throughput": 3953.15, "total_tokens": 613559536} | |
| {"current_steps": 1635, "total_steps": 3099, "loss": 0.0664, "lr": 2.6983233803592022e-05, "epoch": 1.5828391625317682, "percentage": 52.76, "elapsed_time": "1 day, 19:11:25", "remaining_time": "1 day, 14:40:23", "throughput": 3957.87, "total_tokens": 615391184} | |
| {"current_steps": 1640, "total_steps": 3099, "loss": 0.0734, "lr": 2.6842844010567177e-05, "epoch": 1.5876800193634273, "percentage": 52.92, "elapsed_time": "1 day, 19:17:37", "remaining_time": "1 day, 14:30:56", "throughput": 3960.7, "total_tokens": 617305296} | |
| {"current_steps": 1645, "total_steps": 3099, "loss": 0.0674, "lr": 2.6702395761399844e-05, "epoch": 1.5925208761950866, "percentage": 53.08, "elapsed_time": "1 day, 19:22:08", "remaining_time": "1 day, 14:20:00", "throughput": 3965.38, "total_tokens": 619107456} | |
| {"current_steps": 1650, "total_steps": 3099, "loss": 0.0705, "lr": 2.656189351119463e-05, "epoch": 1.5973617330267458, "percentage": 53.24, "elapsed_time": "1 day, 19:27:45", "remaining_time": "1 day, 14:10:05", "throughput": 3968.6, "total_tokens": 620950304} | |
| {"current_steps": 1655, "total_steps": 3099, "loss": 0.0692, "lr": 2.6421341716769112e-05, "epoch": 1.602202589858405, "percentage": 53.4, "elapsed_time": "1 day, 19:32:47", "remaining_time": "1 day, 13:59:40", "throughput": 3972.74, "total_tokens": 622796352} | |
| {"current_steps": 1660, "total_steps": 3099, "loss": 0.0666, "lr": 2.6280744836512423e-05, "epoch": 1.607043446690064, "percentage": 53.57, "elapsed_time": "1 day, 19:38:08", "remaining_time": "1 day, 13:49:34", "throughput": 3976.74, "total_tokens": 624698480} | |
| {"current_steps": 1665, "total_steps": 3099, "loss": 0.0696, "lr": 2.6140107330243858e-05, "epoch": 1.6118843035217232, "percentage": 53.73, "elapsed_time": "1 day, 19:43:00", "remaining_time": "1 day, 13:39:05", "throughput": 3980.97, "total_tokens": 626526800} | |
| {"current_steps": 1670, "total_steps": 3099, "loss": 0.0708, "lr": 2.599943365907138e-05, "epoch": 1.6167251603533825, "percentage": 53.89, "elapsed_time": "1 day, 19:47:33", "remaining_time": "1 day, 13:28:22", "throughput": 3985.59, "total_tokens": 628340752} | |
| {"current_steps": 1675, "total_steps": 3099, "loss": 0.0628, "lr": 2.5858728285250156e-05, "epoch": 1.621566017185042, "percentage": 54.05, "elapsed_time": "1 day, 19:53:13", "remaining_time": "1 day, 13:18:37", "throughput": 3989.38, "total_tokens": 630294736} | |
| {"current_steps": 1680, "total_steps": 3099, "loss": 0.0668, "lr": 2.5717995672040934e-05, "epoch": 1.626406874016701, "percentage": 54.21, "elapsed_time": "1 day, 19:58:25", "remaining_time": "1 day, 13:08:32", "throughput": 3993.41, "total_tokens": 632181360} | |
| {"current_steps": 1685, "total_steps": 3099, "loss": 0.0672, "lr": 2.5577240283568547e-05, "epoch": 1.6312477308483602, "percentage": 54.37, "elapsed_time": "1 day, 20:04:18", "remaining_time": "1 day, 12:59:01", "throughput": 3996.88, "total_tokens": 634139120} | |
| {"current_steps": 1690, "total_steps": 3099, "loss": 0.065, "lr": 2.5436466584680257e-05, "epoch": 1.6360885876800193, "percentage": 54.53, "elapsed_time": "1 day, 20:09:55", "remaining_time": "1 day, 12:49:19", "throughput": 4000.49, "total_tokens": 636061136} | |
| {"current_steps": 1695, "total_steps": 3099, "loss": 0.0679, "lr": 2.529567904080416e-05, "epoch": 1.6409294445116784, "percentage": 54.7, "elapsed_time": "1 day, 20:14:59", "remaining_time": "1 day, 12:39:10", "throughput": 4004.42, "total_tokens": 637901488} | |
| {"current_steps": 1700, "total_steps": 3099, "loss": 0.0674, "lr": 2.5154882117807503e-05, "epoch": 1.6457703013433378, "percentage": 54.86, "elapsed_time": "1 day, 20:20:40", "remaining_time": "1 day, 12:29:35", "throughput": 4007.64, "total_tokens": 639783152} | |
| {"current_steps": 1705, "total_steps": 3099, "loss": 0.0718, "lr": 2.5014080281855062e-05, "epoch": 1.650611158174997, "percentage": 55.02, "elapsed_time": "1 day, 20:25:48", "remaining_time": "1 day, 12:19:32", "throughput": 4011.31, "total_tokens": 641601136} | |
| {"current_steps": 1710, "total_steps": 3099, "loss": 0.0682, "lr": 2.4873277999267443e-05, "epoch": 1.6554520150066563, "percentage": 55.18, "elapsed_time": "1 day, 20:30:28", "remaining_time": "1 day, 12:09:10", "throughput": 4015.93, "total_tokens": 643464448} | |
| {"current_steps": 1715, "total_steps": 3099, "loss": 0.0668, "lr": 2.473247973637942e-05, "epoch": 1.6602928718383154, "percentage": 55.34, "elapsed_time": "1 day, 20:36:12", "remaining_time": "1 day, 11:59:41", "throughput": 4019.38, "total_tokens": 645403984} | |
| {"current_steps": 1720, "total_steps": 3099, "loss": 0.063, "lr": 2.459168995939827e-05, "epoch": 1.6651337286699746, "percentage": 55.5, "elapsed_time": "1 day, 20:41:56", "remaining_time": "1 day, 11:50:13", "throughput": 4022.96, "total_tokens": 647359520} | |
| {"current_steps": 1725, "total_steps": 3099, "loss": 0.0698, "lr": 2.4450913134262077e-05, "epoch": 1.6699745855016337, "percentage": 55.66, "elapsed_time": "1 day, 20:46:51", "remaining_time": "1 day, 11:40:08", "throughput": 4027.13, "total_tokens": 649221056} | |
| {"current_steps": 1730, "total_steps": 3099, "loss": 0.0713, "lr": 2.4310153726498107e-05, "epoch": 1.674815442333293, "percentage": 55.82, "elapsed_time": "1 day, 20:52:47", "remaining_time": "1 day, 11:30:52", "throughput": 4029.74, "total_tokens": 651074128} | |
| {"current_steps": 1735, "total_steps": 3099, "loss": 0.0697, "lr": 2.4169416201081102e-05, "epoch": 1.6796562991649522, "percentage": 55.99, "elapsed_time": "1 day, 20:59:02", "remaining_time": "1 day, 11:21:53", "throughput": 4032.17, "total_tokens": 652978208} | |
| {"current_steps": 1740, "total_steps": 3099, "loss": 0.0661, "lr": 2.4028705022291728e-05, "epoch": 1.6844971559966115, "percentage": 56.15, "elapsed_time": "1 day, 21:05:00", "remaining_time": "1 day, 11:12:42", "throughput": 4035.18, "total_tokens": 654910336} | |
| {"current_steps": 1745, "total_steps": 3099, "loss": 0.0654, "lr": 2.3888024653574865e-05, "epoch": 1.6893380128282707, "percentage": 56.31, "elapsed_time": "1 day, 21:10:32", "remaining_time": "1 day, 11:03:11", "throughput": 4038.77, "total_tokens": 656834320} | |
| {"current_steps": 1750, "total_steps": 3099, "loss": 0.0675, "lr": 2.374737955739814e-05, "epoch": 1.6941788696599298, "percentage": 56.47, "elapsed_time": "1 day, 21:16:17", "remaining_time": "1 day, 10:53:52", "throughput": 4041.95, "total_tokens": 658744624} | |
| {"current_steps": 1755, "total_steps": 3099, "loss": 0.0688, "lr": 2.3606774195110256e-05, "epoch": 1.699019726491589, "percentage": 56.63, "elapsed_time": "1 day, 21:21:50", "remaining_time": "1 day, 10:44:25", "throughput": 4045.4, "total_tokens": 660657152} | |
| {"current_steps": 1760, "total_steps": 3099, "loss": 0.0626, "lr": 2.346621302679957e-05, "epoch": 1.703860583323248, "percentage": 56.79, "elapsed_time": "1 day, 21:27:29", "remaining_time": "1 day, 10:35:03", "throughput": 4049.01, "total_tokens": 662618160} | |
| {"current_steps": 1765, "total_steps": 3099, "loss": 0.0688, "lr": 2.3325700511152572e-05, "epoch": 1.7087014401549074, "percentage": 56.95, "elapsed_time": "1 day, 21:33:00", "remaining_time": "1 day, 10:25:37", "throughput": 4052.11, "total_tokens": 664466176} | |
| {"current_steps": 1770, "total_steps": 3099, "loss": 0.0644, "lr": 2.3185241105312435e-05, "epoch": 1.7135422969865666, "percentage": 57.12, "elapsed_time": "1 day, 21:37:37", "remaining_time": "1 day, 10:15:32", "throughput": 4056.45, "total_tokens": 666303008} | |
| {"current_steps": 1775, "total_steps": 3099, "loss": 0.0654, "lr": 2.3044839264737695e-05, "epoch": 1.718383153818226, "percentage": 57.28, "elapsed_time": "1 day, 21:43:26", "remaining_time": "1 day, 10:06:22", "throughput": 4059.69, "total_tokens": 668249808} | |
| {"current_steps": 1780, "total_steps": 3099, "loss": 0.0618, "lr": 2.2904499443060852e-05, "epoch": 1.723224010649885, "percentage": 57.44, "elapsed_time": "1 day, 21:48:35", "remaining_time": "1 day, 9:56:44", "throughput": 4063.54, "total_tokens": 670142528} | |
| {"current_steps": 1785, "total_steps": 3099, "loss": 0.0705, "lr": 2.2764226091947153e-05, "epoch": 1.7280648674815442, "percentage": 57.6, "elapsed_time": "1 day, 21:53:24", "remaining_time": "1 day, 9:46:52", "throughput": 4067.04, "total_tokens": 671892176} | |
| {"current_steps": 1790, "total_steps": 3099, "loss": 0.0694, "lr": 2.2624023660953322e-05, "epoch": 1.7329057243132033, "percentage": 57.76, "elapsed_time": "1 day, 21:59:15", "remaining_time": "1 day, 9:37:48", "throughput": 4069.89, "total_tokens": 673790848} | |
| {"current_steps": 1795, "total_steps": 3099, "loss": 0.0672, "lr": 2.2483896597386506e-05, "epoch": 1.7377465811448627, "percentage": 57.92, "elapsed_time": "1 day, 22:05:25", "remaining_time": "1 day, 9:28:58", "throughput": 4072.7, "total_tokens": 675763984} | |
| {"current_steps": 1800, "total_steps": 3099, "loss": 0.0664, "lr": 2.2343849346163092e-05, "epoch": 1.7425874379765218, "percentage": 58.08, "elapsed_time": "1 day, 22:10:41", "remaining_time": "1 day, 9:19:30", "throughput": 4076.52, "total_tokens": 677686256} | |
| {"current_steps": 1805, "total_steps": 3099, "loss": 0.067, "lr": 2.2203886349667826e-05, "epoch": 1.7474282948081812, "percentage": 58.24, "elapsed_time": "1 day, 22:15:28", "remaining_time": "1 day, 9:09:43", "throughput": 4080.67, "total_tokens": 679548000} | |
| {"current_steps": 1810, "total_steps": 3099, "loss": 0.0674, "lr": 2.2064012047612796e-05, "epoch": 1.7522691516398403, "percentage": 58.41, "elapsed_time": "1 day, 22:19:23", "remaining_time": "1 day, 8:59:21", "throughput": 4085.56, "total_tokens": 681323824} | |
| {"current_steps": 1815, "total_steps": 3099, "loss": 0.0639, "lr": 2.1924230876896684e-05, "epoch": 1.7571100084714995, "percentage": 58.57, "elapsed_time": "1 day, 22:25:14", "remaining_time": "1 day, 8:50:23", "throughput": 4088.74, "total_tokens": 683289152} | |
| {"current_steps": 1820, "total_steps": 3099, "loss": 0.063, "lr": 2.1784547271463966e-05, "epoch": 1.7619508653031586, "percentage": 58.73, "elapsed_time": "1 day, 22:31:00", "remaining_time": "1 day, 8:41:22", "throughput": 4092.0, "total_tokens": 685248960} | |
| {"current_steps": 1825, "total_steps": 3099, "loss": 0.0658, "lr": 2.164496566216428e-05, "epoch": 1.7667917221348177, "percentage": 58.89, "elapsed_time": "1 day, 22:35:27", "remaining_time": "1 day, 8:31:27", "throughput": 4096.37, "total_tokens": 687075264} | |
| {"current_steps": 1830, "total_steps": 3099, "loss": 0.0706, "lr": 2.150549047661193e-05, "epoch": 1.771632578966477, "percentage": 59.05, "elapsed_time": "1 day, 22:40:40", "remaining_time": "1 day, 8:22:06", "throughput": 4099.78, "total_tokens": 688930992} | |
| {"current_steps": 1835, "total_steps": 3099, "loss": 0.0633, "lr": 2.136612613904533e-05, "epoch": 1.7764734357981364, "percentage": 59.21, "elapsed_time": "1 day, 22:44:58", "remaining_time": "1 day, 8:12:09", "throughput": 4104.22, "total_tokens": 690736016} | |
| {"current_steps": 1840, "total_steps": 3099, "loss": 0.068, "lr": 2.1226877070186782e-05, "epoch": 1.7813142926297956, "percentage": 59.37, "elapsed_time": "1 day, 22:50:36", "remaining_time": "1 day, 8:03:07", "throughput": 4107.48, "total_tokens": 692670496} | |
| {"current_steps": 1845, "total_steps": 3099, "loss": 0.0643, "lr": 2.108774768710215e-05, "epoch": 1.7861551494614547, "percentage": 59.54, "elapsed_time": "1 day, 22:56:19", "remaining_time": "1 day, 7:54:11", "throughput": 4110.64, "total_tokens": 694613552} | |
| {"current_steps": 1850, "total_steps": 3099, "loss": 0.0667, "lr": 2.0948742403060838e-05, "epoch": 1.7909960062931138, "percentage": 59.7, "elapsed_time": "1 day, 23:01:19", "remaining_time": "1 day, 7:44:46", "throughput": 4114.3, "total_tokens": 696469216} | |
| {"current_steps": 1855, "total_steps": 3099, "loss": 0.0681, "lr": 2.0809865627395705e-05, "epoch": 1.795836863124773, "percentage": 59.86, "elapsed_time": "1 day, 23:07:32", "remaining_time": "1 day, 7:36:12", "throughput": 4116.76, "total_tokens": 698418624} | |
| {"current_steps": 1860, "total_steps": 3099, "loss": 0.0647, "lr": 2.0671121765363288e-05, "epoch": 1.8006777199564323, "percentage": 60.02, "elapsed_time": "1 day, 23:14:03", "remaining_time": "1 day, 7:27:50", "throughput": 4118.86, "total_tokens": 700384480} | |
| {"current_steps": 1865, "total_steps": 3099, "loss": 0.0699, "lr": 2.0532515218003985e-05, "epoch": 1.8055185767880915, "percentage": 60.18, "elapsed_time": "1 day, 23:20:04", "remaining_time": "1 day, 7:19:09", "throughput": 4121.41, "total_tokens": 702304704} | |
| {"current_steps": 1870, "total_steps": 3099, "loss": 0.0691, "lr": 2.039405038200252e-05, "epoch": 1.8103594336197508, "percentage": 60.34, "elapsed_time": "1 day, 23:25:15", "remaining_time": "1 day, 7:09:57", "throughput": 4124.97, "total_tokens": 704195280} | |
| {"current_steps": 1875, "total_steps": 3099, "loss": 0.0656, "lr": 2.0255731649548427e-05, "epoch": 1.81520029045141, "percentage": 60.5, "elapsed_time": "1 day, 23:30:32", "remaining_time": "1 day, 7:00:50", "throughput": 4128.21, "total_tokens": 706059712} | |
| {"current_steps": 1880, "total_steps": 3099, "loss": 0.0649, "lr": 2.011756340819673e-05, "epoch": 1.820041147283069, "percentage": 60.66, "elapsed_time": "1 day, 23:37:00", "remaining_time": "1 day, 6:52:29", "throughput": 4130.49, "total_tokens": 708049376} | |
| {"current_steps": 1885, "total_steps": 3099, "loss": 0.0677, "lr": 1.9979550040728838e-05, "epoch": 1.8248820041147282, "percentage": 60.83, "elapsed_time": "1 day, 23:42:31", "remaining_time": "1 day, 6:43:33", "throughput": 4133.64, "total_tokens": 709957648} | |
| {"current_steps": 1890, "total_steps": 3099, "loss": 0.0666, "lr": 1.9841695925013406e-05, "epoch": 1.8297228609463874, "percentage": 60.99, "elapsed_time": "1 day, 23:47:25", "remaining_time": "1 day, 6:34:14", "throughput": 4137.14, "total_tokens": 711775040} | |
| {"current_steps": 1895, "total_steps": 3099, "loss": 0.0652, "lr": 1.9704005433867555e-05, "epoch": 1.8345637177780467, "percentage": 61.15, "elapsed_time": "1 day, 23:52:43", "remaining_time": "1 day, 6:25:12", "throughput": 4140.48, "total_tokens": 713667296} | |
| {"current_steps": 1900, "total_steps": 3099, "loss": 0.0653, "lr": 1.9566482934918135e-05, "epoch": 1.839404574609706, "percentage": 61.31, "elapsed_time": "1 day, 23:57:59", "remaining_time": "1 day, 6:16:09", "throughput": 4143.93, "total_tokens": 715572784} | |
| {"current_steps": 1905, "total_steps": 3099, "loss": 0.0623, "lr": 1.9429132790463172e-05, "epoch": 1.8442454314413652, "percentage": 61.47, "elapsed_time": "2 days, 0:02:31", "remaining_time": "1 day, 6:06:41", "throughput": 4147.99, "total_tokens": 717403184} | |
| {"current_steps": 1910, "total_steps": 3099, "loss": 0.0652, "lr": 1.9291959357333495e-05, "epoch": 1.8490862882730243, "percentage": 61.63, "elapsed_time": "2 days, 0:06:58", "remaining_time": "1 day, 5:57:10", "throughput": 4151.93, "total_tokens": 719188672} | |
| {"current_steps": 1915, "total_steps": 3099, "loss": 0.0656, "lr": 1.9154966986754568e-05, "epoch": 1.8539271451046835, "percentage": 61.79, "elapsed_time": "2 days, 0:12:48", "remaining_time": "1 day, 5:48:33", "throughput": 4154.8, "total_tokens": 721142368} | |
| {"current_steps": 1920, "total_steps": 3099, "loss": 0.0673, "lr": 1.9018160024208406e-05, "epoch": 1.8587680019363426, "percentage": 61.96, "elapsed_time": "2 days, 0:17:18", "remaining_time": "1 day, 5:39:07", "throughput": 4158.7, "total_tokens": 722942560} | |
| {"current_steps": 1925, "total_steps": 3099, "loss": 0.0659, "lr": 1.8881542809295804e-05, "epoch": 1.863608858768002, "percentage": 62.12, "elapsed_time": "2 days, 0:22:47", "remaining_time": "1 day, 5:30:19", "throughput": 4161.8, "total_tokens": 724852000} | |
| {"current_steps": 1930, "total_steps": 3099, "loss": 0.0635, "lr": 1.874511967559861e-05, "epoch": 1.868449715599661, "percentage": 62.28, "elapsed_time": "2 days, 0:27:37", "remaining_time": "1 day, 5:21:08", "throughput": 4165.59, "total_tokens": 726715728} | |
| {"current_steps": 1935, "total_steps": 3099, "loss": 0.0675, "lr": 1.860889495054231e-05, "epoch": 1.8732905724313205, "percentage": 62.44, "elapsed_time": "2 days, 0:32:20", "remaining_time": "1 day, 5:11:55", "throughput": 4169.32, "total_tokens": 728548704} | |
| {"current_steps": 1940, "total_steps": 3099, "loss": 0.065, "lr": 1.8472872955258764e-05, "epoch": 1.8781314292629796, "percentage": 62.6, "elapsed_time": "2 days, 0:37:48", "remaining_time": "1 day, 5:03:09", "throughput": 4172.41, "total_tokens": 730456800} | |
| {"current_steps": 1945, "total_steps": 3099, "loss": 0.066, "lr": 1.8337058004449087e-05, "epoch": 1.8829722860946387, "percentage": 62.76, "elapsed_time": "2 days, 0:42:53", "remaining_time": "1 day, 4:54:12", "throughput": 4175.63, "total_tokens": 732296016} | |
| {"current_steps": 1950, "total_steps": 3099, "loss": 0.0651, "lr": 1.8201454406246853e-05, "epoch": 1.8878131429262979, "percentage": 62.92, "elapsed_time": "2 days, 0:48:59", "remaining_time": "1 day, 4:45:51", "throughput": 4178.11, "total_tokens": 734259984} | |
| {"current_steps": 1955, "total_steps": 3099, "loss": 0.0626, "lr": 1.8066066462081365e-05, "epoch": 1.892653999757957, "percentage": 63.08, "elapsed_time": "2 days, 0:54:12", "remaining_time": "1 day, 4:36:59", "throughput": 4181.34, "total_tokens": 736134608} | |
| {"current_steps": 1960, "total_steps": 3099, "loss": 0.0643, "lr": 1.7930898466541278e-05, "epoch": 1.8974948565896164, "percentage": 63.25, "elapsed_time": "2 days, 0:59:08", "remaining_time": "1 day, 4:28:00", "throughput": 4184.61, "total_tokens": 737950480} | |
| {"current_steps": 1965, "total_steps": 3099, "loss": 0.0615, "lr": 1.779595470723831e-05, "epoch": 1.9023357134212757, "percentage": 63.41, "elapsed_time": "2 days, 1:04:07", "remaining_time": "1 day, 4:19:03", "throughput": 4188.21, "total_tokens": 739837152} | |
| {"current_steps": 1970, "total_steps": 3099, "loss": 0.0665, "lr": 1.7661239464671307e-05, "epoch": 1.9071765702529349, "percentage": 63.57, "elapsed_time": "2 days, 1:09:25", "remaining_time": "1 day, 4:10:18", "throughput": 4191.34, "total_tokens": 741721280} | |
| {"current_steps": 1975, "total_steps": 3099, "loss": 0.0651, "lr": 1.7526757012090384e-05, "epoch": 1.912017427084594, "percentage": 63.73, "elapsed_time": "2 days, 1:14:28", "remaining_time": "1 day, 4:01:25", "throughput": 4194.6, "total_tokens": 743570432} | |
| {"current_steps": 1980, "total_steps": 3099, "loss": 0.0651, "lr": 1.7392511615361454e-05, "epoch": 1.9168582839162531, "percentage": 63.89, "elapsed_time": "2 days, 1:18:52", "remaining_time": "1 day, 3:52:12", "throughput": 4198.3, "total_tokens": 745332208} | |
| {"current_steps": 1985, "total_steps": 3099, "loss": 0.0648, "lr": 1.7258507532830843e-05, "epoch": 1.9216991407479123, "percentage": 64.05, "elapsed_time": "2 days, 1:24:58", "remaining_time": "1 day, 3:43:58", "throughput": 4200.81, "total_tokens": 747317616} | |
| {"current_steps": 1990, "total_steps": 3099, "loss": 0.0646, "lr": 1.7124749015190245e-05, "epoch": 1.9265399975795716, "percentage": 64.21, "elapsed_time": "2 days, 1:29:58", "remaining_time": "1 day, 3:35:07", "throughput": 4204.2, "total_tokens": 749180048} | |
| {"current_steps": 1995, "total_steps": 3099, "loss": 0.0629, "lr": 1.699124030534191e-05, "epoch": 1.9313808544112308, "percentage": 64.38, "elapsed_time": "2 days, 1:34:53", "remaining_time": "1 day, 3:26:15", "throughput": 4207.65, "total_tokens": 751039536} | |
| {"current_steps": 2000, "total_steps": 3099, "loss": 0.0669, "lr": 1.6857985638263994e-05, "epoch": 1.93622171124289, "percentage": 64.54, "elapsed_time": "2 days, 1:39:33", "remaining_time": "1 day, 3:17:15", "throughput": 4211.54, "total_tokens": 752911840} | |
| {"current_steps": 2005, "total_steps": 3099, "loss": 0.0633, "lr": 1.6724989240876302e-05, "epoch": 1.9410625680745492, "percentage": 64.7, "elapsed_time": "2 days, 1:44:24", "remaining_time": "1 day, 3:08:23", "throughput": 4215.16, "total_tokens": 754784096} | |
| {"current_steps": 2010, "total_steps": 3099, "loss": 0.0631, "lr": 1.6592255331906127e-05, "epoch": 1.9459034249062084, "percentage": 64.86, "elapsed_time": "2 days, 1:49:42", "remaining_time": "1 day, 2:59:47", "throughput": 4218.07, "total_tokens": 756649472} | |
| {"current_steps": 2015, "total_steps": 3099, "loss": 0.0611, "lr": 1.64597881217545e-05, "epoch": 1.9507442817378675, "percentage": 65.02, "elapsed_time": "2 days, 1:54:41", "remaining_time": "1 day, 2:51:02", "throughput": 4221.56, "total_tokens": 758536336} | |
| {"current_steps": 2020, "total_steps": 3099, "loss": 0.0653, "lr": 1.632759181236258e-05, "epoch": 1.9555851385695266, "percentage": 65.18, "elapsed_time": "2 days, 1:59:49", "remaining_time": "1 day, 2:42:22", "throughput": 4224.58, "total_tokens": 760377888} | |
| {"current_steps": 2025, "total_steps": 3099, "loss": 0.0674, "lr": 1.61956705970784e-05, "epoch": 1.960425995401186, "percentage": 65.34, "elapsed_time": "2 days, 2:05:38", "remaining_time": "1 day, 2:34:05", "throughput": 4226.94, "total_tokens": 762278528} | |
| {"current_steps": 2030, "total_steps": 3099, "loss": 0.0666, "lr": 1.606402866052382e-05, "epoch": 1.9652668522328454, "percentage": 65.51, "elapsed_time": "2 days, 2:10:00", "remaining_time": "1 day, 2:25:04", "throughput": 4230.67, "total_tokens": 764061840} | |
| {"current_steps": 2035, "total_steps": 3099, "loss": 0.0652, "lr": 1.593267017846185e-05, "epoch": 1.9701077090645045, "percentage": 65.67, "elapsed_time": "2 days, 2:15:37", "remaining_time": "1 day, 2:16:43", "throughput": 4233.47, "total_tokens": 765994112} | |
| {"current_steps": 2040, "total_steps": 3099, "loss": 0.0655, "lr": 1.5801599317664106e-05, "epoch": 1.9749485658961636, "percentage": 65.83, "elapsed_time": "2 days, 2:20:45", "remaining_time": "1 day, 2:08:07", "throughput": 4236.65, "total_tokens": 767872592} | |
| {"current_steps": 2045, "total_steps": 3099, "loss": 0.0643, "lr": 1.567082023577869e-05, "epoch": 1.9797894227278228, "percentage": 65.99, "elapsed_time": "2 days, 2:26:10", "remaining_time": "1 day, 1:59:41", "throughput": 4239.42, "total_tokens": 769751856} | |
| {"current_steps": 2050, "total_steps": 3099, "loss": 0.0614, "lr": 1.554033708119832e-05, "epoch": 1.984630279559482, "percentage": 66.15, "elapsed_time": "2 days, 2:31:15", "remaining_time": "1 day, 1:51:06", "throughput": 4242.81, "total_tokens": 771662720} | |
| {"current_steps": 2055, "total_steps": 3099, "loss": 0.0637, "lr": 1.5410153992928685e-05, "epoch": 1.9894711363911413, "percentage": 66.31, "elapsed_time": "2 days, 2:36:43", "remaining_time": "1 day, 1:42:44", "throughput": 4245.46, "total_tokens": 773536048} | |
| {"current_steps": 2060, "total_steps": 3099, "loss": 0.0647, "lr": 1.528027510045723e-05, "epoch": 1.9943119932228004, "percentage": 66.47, "elapsed_time": "2 days, 2:42:05", "remaining_time": "1 day, 1:34:20", "throughput": 4248.45, "total_tokens": 775448176} | |
| {"current_steps": 2065, "total_steps": 3099, "loss": 0.0633, "lr": 1.5150704523622066e-05, "epoch": 1.9991528500544598, "percentage": 66.63, "elapsed_time": "2 days, 2:46:59", "remaining_time": "1 day, 1:25:42", "throughput": 4251.93, "total_tokens": 777334320} | |
| {"current_steps": 2070, "total_steps": 3099, "loss": 0.0456, "lr": 1.5021446372481408e-05, "epoch": 2.0038726854653275, "percentage": 66.8, "elapsed_time": "2 days, 2:53:22", "remaining_time": "1 day, 1:17:50", "throughput": 4253.6, "total_tokens": 779269280} | |
| {"current_steps": 2075, "total_steps": 3099, "loss": 0.0469, "lr": 1.4892504747183078e-05, "epoch": 2.0087135422969866, "percentage": 66.96, "elapsed_time": "2 days, 2:58:12", "remaining_time": "1 day, 1:09:12", "throughput": 4256.91, "total_tokens": 781110080} | |
| {"current_steps": 2080, "total_steps": 3099, "loss": 0.0424, "lr": 1.4763883737834538e-05, "epoch": 2.0135543991286458, "percentage": 67.12, "elapsed_time": "2 days, 3:03:35", "remaining_time": "1 day, 1:00:51", "throughput": 4259.79, "total_tokens": 783014480} | |
| {"current_steps": 2085, "total_steps": 3099, "loss": 0.0432, "lr": 1.4635587424373104e-05, "epoch": 2.018395255960305, "percentage": 67.28, "elapsed_time": "2 days, 3:08:25", "remaining_time": "1 day, 0:52:16", "throughput": 4263.41, "total_tokens": 784918160} | |
| {"current_steps": 2090, "total_steps": 3099, "loss": 0.0417, "lr": 1.4507619876436548e-05, "epoch": 2.023236112791964, "percentage": 67.44, "elapsed_time": "2 days, 3:14:27", "remaining_time": "1 day, 0:44:16", "throughput": 4265.94, "total_tokens": 786925872} | |
| {"current_steps": 2095, "total_steps": 3099, "loss": 0.0427, "lr": 1.4379985153233983e-05, "epoch": 2.0280769696236236, "percentage": 67.6, "elapsed_time": "2 days, 3:20:54", "remaining_time": "1 day, 0:36:29", "throughput": 4267.59, "total_tokens": 788883568} | |
| {"current_steps": 2100, "total_steps": 3099, "loss": 0.0447, "lr": 1.4252687303417125e-05, "epoch": 2.0329178264552827, "percentage": 67.76, "elapsed_time": "2 days, 3:27:01", "remaining_time": "1 day, 0:28:32", "throughput": 4269.67, "total_tokens": 790834704} | |
| {"current_steps": 2105, "total_steps": 3099, "loss": 0.044, "lr": 1.4125730364951867e-05, "epoch": 2.037758683286942, "percentage": 67.93, "elapsed_time": "2 days, 3:31:30", "remaining_time": "1 day, 0:19:50", "throughput": 4273.25, "total_tokens": 792644976} | |
| {"current_steps": 2110, "total_steps": 3099, "loss": 0.0432, "lr": 1.3999118364990172e-05, "epoch": 2.042599540118601, "percentage": 68.09, "elapsed_time": "2 days, 3:36:53", "remaining_time": "1 day, 0:11:34", "throughput": 4275.9, "total_tokens": 794521776} | |
| {"current_steps": 2115, "total_steps": 3099, "loss": 0.0465, "lr": 1.387285531974235e-05, "epoch": 2.04744039695026, "percentage": 68.25, "elapsed_time": "2 days, 3:41:33", "remaining_time": "1 day, 0:02:59", "throughput": 4279.17, "total_tokens": 796324144} | |
| {"current_steps": 2120, "total_steps": 3099, "loss": 0.042, "lr": 1.3746945234349651e-05, "epoch": 2.0522812537819193, "percentage": 68.41, "elapsed_time": "2 days, 3:46:20", "remaining_time": "23:54:29", "throughput": 4282.51, "total_tokens": 798176336} | |
| {"current_steps": 2125, "total_steps": 3099, "loss": 0.0454, "lr": 1.3621392102757236e-05, "epoch": 2.0571221106135784, "percentage": 68.57, "elapsed_time": "2 days, 3:51:27", "remaining_time": "23:46:08", "throughput": 4285.13, "total_tokens": 799981648} | |
| {"current_steps": 2130, "total_steps": 3099, "loss": 0.0447, "lr": 1.3496199907587426e-05, "epoch": 2.061962967445238, "percentage": 68.73, "elapsed_time": "2 days, 3:57:06", "remaining_time": "23:38:03", "throughput": 4287.73, "total_tokens": 801919920} | |
| {"current_steps": 2135, "total_steps": 3099, "loss": 0.0422, "lr": 1.337137262001349e-05, "epoch": 2.066803824276897, "percentage": 68.89, "elapsed_time": "2 days, 4:02:50", "remaining_time": "23:30:02", "throughput": 4290.05, "total_tokens": 803830048} | |
| {"current_steps": 2140, "total_steps": 3099, "loss": 0.0414, "lr": 1.324691419963352e-05, "epoch": 2.0716446811085563, "percentage": 69.05, "elapsed_time": "2 days, 4:07:37", "remaining_time": "23:21:35", "throughput": 4293.49, "total_tokens": 805707856} | |
| {"current_steps": 2145, "total_steps": 3099, "loss": 0.0445, "lr": 1.3122828594345007e-05, "epoch": 2.0764855379402154, "percentage": 69.22, "elapsed_time": "2 days, 4:13:09", "remaining_time": "23:13:29", "throughput": 4296.12, "total_tokens": 807627408} | |
| {"current_steps": 2150, "total_steps": 3099, "loss": 0.0462, "lr": 1.2999119740219434e-05, "epoch": 2.0813263947718745, "percentage": 69.38, "elapsed_time": "2 days, 4:17:54", "remaining_time": "23:05:03", "throughput": 4299.59, "total_tokens": 809504384} | |
| {"current_steps": 2155, "total_steps": 3099, "loss": 0.0458, "lr": 1.2875791561377557e-05, "epoch": 2.0861672516035337, "percentage": 69.54, "elapsed_time": "2 days, 4:23:18", "remaining_time": "22:56:55", "throughput": 4302.14, "total_tokens": 811379696} | |
| {"current_steps": 2160, "total_steps": 3099, "loss": 0.0425, "lr": 1.2752847969864857e-05, "epoch": 2.091008108435193, "percentage": 69.7, "elapsed_time": "2 days, 4:27:52", "remaining_time": "22:48:27", "throughput": 4305.37, "total_tokens": 813165728} | |
| {"current_steps": 2165, "total_steps": 3099, "loss": 0.0425, "lr": 1.2630292865527483e-05, "epoch": 2.0958489652668524, "percentage": 69.86, "elapsed_time": "2 days, 4:32:57", "remaining_time": "22:40:12", "throughput": 4308.55, "total_tokens": 815080720} | |
| {"current_steps": 2170, "total_steps": 3099, "loss": 0.0425, "lr": 1.2508130135888518e-05, "epoch": 2.1006898220985115, "percentage": 70.02, "elapsed_time": "2 days, 4:40:29", "remaining_time": "22:33:02", "throughput": 4308.79, "total_tokens": 817073936} | |
| {"current_steps": 2175, "total_steps": 3099, "loss": 0.0415, "lr": 1.2386363656024691e-05, "epoch": 2.1055306789301707, "percentage": 70.18, "elapsed_time": "2 days, 4:45:48", "remaining_time": "22:24:55", "throughput": 4311.63, "total_tokens": 818989136} | |
| {"current_steps": 2180, "total_steps": 3099, "loss": 0.0425, "lr": 1.226499728844345e-05, "epoch": 2.11037153576183, "percentage": 70.35, "elapsed_time": "2 days, 4:52:13", "remaining_time": "22:17:17", "throughput": 4313.33, "total_tokens": 820972848} | |
| {"current_steps": 2185, "total_steps": 3099, "loss": 0.0398, "lr": 1.2144034882960392e-05, "epoch": 2.115212392593489, "percentage": 70.51, "elapsed_time": "2 days, 4:57:52", "remaining_time": "22:09:19", "throughput": 4315.81, "total_tokens": 822903904} | |
| {"current_steps": 2190, "total_steps": 3099, "loss": 0.0473, "lr": 1.2023480276577267e-05, "epoch": 2.120053249425148, "percentage": 70.67, "elapsed_time": "2 days, 5:03:46", "remaining_time": "22:01:29", "throughput": 4317.8, "total_tokens": 824814944} | |
| {"current_steps": 2195, "total_steps": 3099, "loss": 0.042, "lr": 1.1903337293360101e-05, "epoch": 2.1248941062568076, "percentage": 70.83, "elapsed_time": "2 days, 5:08:14", "remaining_time": "21:53:03", "throughput": 4321.36, "total_tokens": 826652352} | |
| {"current_steps": 2200, "total_steps": 3099, "loss": 0.0419, "lr": 1.1783609744318057e-05, "epoch": 2.1297349630884668, "percentage": 70.99, "elapsed_time": "2 days, 5:14:06", "remaining_time": "21:45:13", "throughput": 4323.51, "total_tokens": 828587888} | |
| {"current_steps": 2205, "total_steps": 3099, "loss": 0.0449, "lr": 1.1664301427282418e-05, "epoch": 2.134575819920126, "percentage": 71.15, "elapsed_time": "2 days, 5:18:38", "remaining_time": "21:36:51", "throughput": 4326.79, "total_tokens": 830391184} | |
| {"current_steps": 2210, "total_steps": 3099, "loss": 0.0476, "lr": 1.154541612678619e-05, "epoch": 2.139416676751785, "percentage": 71.31, "elapsed_time": "2 days, 5:24:06", "remaining_time": "21:28:53", "throughput": 4329.24, "total_tokens": 832282752} | |
| {"current_steps": 2215, "total_steps": 3099, "loss": 0.0457, "lr": 1.1426957613944039e-05, "epoch": 2.144257533583444, "percentage": 71.47, "elapsed_time": "2 days, 5:29:27", "remaining_time": "21:20:53", "throughput": 4331.66, "total_tokens": 834136992} | |
| {"current_steps": 2220, "total_steps": 3099, "loss": 0.0417, "lr": 1.1308929646332658e-05, "epoch": 2.1490983904151033, "percentage": 71.64, "elapsed_time": "2 days, 5:34:49", "remaining_time": "21:12:53", "throughput": 4334.36, "total_tokens": 836052320} | |
| {"current_steps": 2225, "total_steps": 3099, "loss": 0.0439, "lr": 1.1191335967871582e-05, "epoch": 2.153939247246763, "percentage": 71.8, "elapsed_time": "2 days, 5:39:28", "remaining_time": "21:04:38", "throughput": 4337.58, "total_tokens": 837885568} | |
| {"current_steps": 2230, "total_steps": 3099, "loss": 0.0448, "lr": 1.1074180308704429e-05, "epoch": 2.158780104078422, "percentage": 71.96, "elapsed_time": "2 days, 5:44:41", "remaining_time": "20:56:37", "throughput": 4340.39, "total_tokens": 839786048} | |
| {"current_steps": 2235, "total_steps": 3099, "loss": 0.0462, "lr": 1.0957466385080578e-05, "epoch": 2.163620960910081, "percentage": 72.12, "elapsed_time": "2 days, 5:49:36", "remaining_time": "20:48:29", "throughput": 4343.34, "total_tokens": 841636432} | |
| {"current_steps": 2240, "total_steps": 3099, "loss": 0.0435, "lr": 1.0841197899237282e-05, "epoch": 2.1684618177417403, "percentage": 72.28, "elapsed_time": "2 days, 5:55:30", "remaining_time": "20:40:45", "throughput": 4345.47, "total_tokens": 843588608} | |
| {"current_steps": 2245, "total_steps": 3099, "loss": 0.0435, "lr": 1.0725378539282246e-05, "epoch": 2.1733026745733994, "percentage": 72.44, "elapsed_time": "2 days, 6:01:04", "remaining_time": "20:32:54", "throughput": 4347.71, "total_tokens": 845476688} | |
| {"current_steps": 2250, "total_steps": 3099, "loss": 0.0426, "lr": 1.061001197907659e-05, "epoch": 2.1781435314050586, "percentage": 72.6, "elapsed_time": "2 days, 6:05:54", "remaining_time": "20:24:47", "throughput": 4350.82, "total_tokens": 847341792} | |
| {"current_steps": 2255, "total_steps": 3099, "loss": 0.0438, "lr": 1.0495101878118408e-05, "epoch": 2.1829843882367177, "percentage": 72.77, "elapsed_time": "2 days, 6:10:17", "remaining_time": "20:16:31", "throughput": 4354.17, "total_tokens": 849140496} | |
| {"current_steps": 2260, "total_steps": 3099, "loss": 0.0421, "lr": 1.0380651881426567e-05, "epoch": 2.1878252450683773, "percentage": 72.93, "elapsed_time": "2 days, 6:14:19", "remaining_time": "20:08:07", "throughput": 4358.01, "total_tokens": 850942480} | |
| {"current_steps": 2265, "total_steps": 3099, "loss": 0.0441, "lr": 1.0266665619425181e-05, "epoch": 2.1926661019000364, "percentage": 73.09, "elapsed_time": "2 days, 6:19:12", "remaining_time": "20:00:04", "throughput": 4360.72, "total_tokens": 852750800} | |
| {"current_steps": 2270, "total_steps": 3099, "loss": 0.0427, "lr": 1.0153146707828404e-05, "epoch": 2.1975069587316955, "percentage": 73.25, "elapsed_time": "2 days, 6:25:05", "remaining_time": "19:52:24", "throughput": 4362.84, "total_tokens": 854703456} | |
| {"current_steps": 2275, "total_steps": 3099, "loss": 0.0438, "lr": 1.004009874752575e-05, "epoch": 2.2023478155633547, "percentage": 73.41, "elapsed_time": "2 days, 6:31:19", "remaining_time": "19:44:52", "throughput": 4364.36, "total_tokens": 856635792} | |
| {"current_steps": 2280, "total_steps": 3099, "loss": 0.0435, "lr": 9.927525324467866e-06, "epoch": 2.207188672395014, "percentage": 73.57, "elapsed_time": "2 days, 6:37:10", "remaining_time": "19:37:11", "throughput": 4366.28, "total_tokens": 858544176} | |
| {"current_steps": 2285, "total_steps": 3099, "loss": 0.0412, "lr": 9.81543000955279e-06, "epoch": 2.212029529226673, "percentage": 73.73, "elapsed_time": "2 days, 6:42:06", "remaining_time": "19:29:12", "throughput": 4369.2, "total_tokens": 860409424} | |
| {"current_steps": 2290, "total_steps": 3099, "loss": 0.0415, "lr": 9.703816358512674e-06, "epoch": 2.2168703860583325, "percentage": 73.89, "elapsed_time": "2 days, 6:47:17", "remaining_time": "19:21:19", "throughput": 4371.98, "total_tokens": 862320048} | |
| {"current_steps": 2295, "total_steps": 3099, "loss": 0.0442, "lr": 9.592687911801001e-06, "epoch": 2.2217112428899917, "percentage": 74.06, "elapsed_time": "2 days, 6:53:14", "remaining_time": "19:13:42", "throughput": 4373.83, "total_tokens": 864243216} | |
| {"current_steps": 2300, "total_steps": 3099, "loss": 0.0425, "lr": 9.482048194480275e-06, "epoch": 2.226552099721651, "percentage": 74.22, "elapsed_time": "2 days, 6:58:52", "remaining_time": "19:06:00", "throughput": 4376.07, "total_tokens": 866168848} | |
| {"current_steps": 2305, "total_steps": 3099, "loss": 0.0431, "lr": 9.371900716110183e-06, "epoch": 2.23139295655331, "percentage": 74.38, "elapsed_time": "2 days, 7:03:58", "remaining_time": "18:58:07", "throughput": 4378.76, "total_tokens": 868041296} | |
| {"current_steps": 2310, "total_steps": 3099, "loss": 0.046, "lr": 9.262248970636334e-06, "epoch": 2.236233813384969, "percentage": 74.54, "elapsed_time": "2 days, 7:08:51", "remaining_time": "18:50:10", "throughput": 4381.55, "total_tokens": 869878384} | |
| {"current_steps": 2315, "total_steps": 3099, "loss": 0.042, "lr": 9.153096436279327e-06, "epoch": 2.241074670216628, "percentage": 74.7, "elapsed_time": "2 days, 7:13:37", "remaining_time": "18:42:11", "throughput": 4384.37, "total_tokens": 871688688} | |
| {"current_steps": 2320, "total_steps": 3099, "loss": 0.0431, "lr": 9.044446575424548e-06, "epoch": 2.2459155270482873, "percentage": 74.86, "elapsed_time": "2 days, 7:20:28", "remaining_time": "18:34:56", "throughput": 4385.57, "total_tokens": 873728640} | |
| {"current_steps": 2325, "total_steps": 3099, "loss": 0.0439, "lr": 8.936302834512206e-06, "epoch": 2.250756383879947, "percentage": 75.02, "elapsed_time": "2 days, 7:25:49", "remaining_time": "18:27:10", "throughput": 4387.89, "total_tokens": 875601696} | |
| {"current_steps": 2330, "total_steps": 3099, "loss": 0.0419, "lr": 8.828668643928112e-06, "epoch": 2.255597240711606, "percentage": 75.19, "elapsed_time": "2 days, 7:31:48", "remaining_time": "18:19:38", "throughput": 4389.81, "total_tokens": 877559760} | |
| {"current_steps": 2335, "total_steps": 3099, "loss": 0.0432, "lr": 8.721547417894816e-06, "epoch": 2.260438097543265, "percentage": 75.35, "elapsed_time": "2 days, 7:36:55", "remaining_time": "18:11:49", "throughput": 4392.23, "total_tokens": 879392576} | |
| {"current_steps": 2340, "total_steps": 3099, "loss": 0.0453, "lr": 8.614942554363326e-06, "epoch": 2.2652789543749243, "percentage": 75.51, "elapsed_time": "2 days, 7:41:40", "remaining_time": "18:03:54", "throughput": 4394.9, "total_tokens": 881180800} | |
| {"current_steps": 2345, "total_steps": 3099, "loss": 0.0423, "lr": 8.508857434905304e-06, "epoch": 2.2701198112065835, "percentage": 75.67, "elapsed_time": "2 days, 7:47:01", "remaining_time": "17:56:11", "throughput": 4397.18, "total_tokens": 883048928} | |
| {"current_steps": 2350, "total_steps": 3099, "loss": 0.0424, "lr": 8.40329542460582e-06, "epoch": 2.2749606680382426, "percentage": 75.83, "elapsed_time": "2 days, 7:52:36", "remaining_time": "17:48:33", "throughput": 4399.56, "total_tokens": 885000208} | |
| {"current_steps": 2355, "total_steps": 3099, "loss": 0.0432, "lr": 8.298259871956596e-06, "epoch": 2.279801524869902, "percentage": 75.99, "elapsed_time": "2 days, 7:58:14", "remaining_time": "17:40:56", "throughput": 4401.8, "total_tokens": 886939040} | |
| {"current_steps": 2360, "total_steps": 3099, "loss": 0.0408, "lr": 8.193754108749793e-06, "epoch": 2.2846423817015613, "percentage": 76.15, "elapsed_time": "2 days, 8:04:13", "remaining_time": "17:33:27", "throughput": 4403.97, "total_tokens": 888957616} | |
| {"current_steps": 2365, "total_steps": 3099, "loss": 0.0427, "lr": 8.08978144997234e-06, "epoch": 2.2894832385332204, "percentage": 76.31, "elapsed_time": "2 days, 8:08:51", "remaining_time": "17:25:33", "throughput": 4406.8, "total_tokens": 890755008} | |
| {"current_steps": 2370, "total_steps": 3099, "loss": 0.0414, "lr": 7.986345193700726e-06, "epoch": 2.2943240953648796, "percentage": 76.48, "elapsed_time": "2 days, 8:14:31", "remaining_time": "17:17:59", "throughput": 4408.89, "total_tokens": 892675136} | |
| {"current_steps": 2375, "total_steps": 3099, "loss": 0.0427, "lr": 7.883448620996489e-06, "epoch": 2.2991649521965387, "percentage": 76.64, "elapsed_time": "2 days, 8:19:03", "remaining_time": "17:10:04", "throughput": 4411.77, "total_tokens": 894455920} | |
| {"current_steps": 2380, "total_steps": 3099, "loss": 0.0485, "lr": 7.781094995802007e-06, "epoch": 2.304005809028198, "percentage": 76.8, "elapsed_time": "2 days, 8:24:52", "remaining_time": "17:02:34", "throughput": 4413.44, "total_tokens": 896339664} | |
| {"current_steps": 2385, "total_steps": 3099, "loss": 0.0417, "lr": 7.679287564837074e-06, "epoch": 2.308846665859857, "percentage": 76.96, "elapsed_time": "2 days, 8:29:52", "remaining_time": "16:54:49", "throughput": 4415.93, "total_tokens": 898166624} | |
| {"current_steps": 2390, "total_steps": 3099, "loss": 0.0408, "lr": 7.57802955749585e-06, "epoch": 2.3136875226915166, "percentage": 77.12, "elapsed_time": "2 days, 8:35:57", "remaining_time": "16:47:25", "throughput": 4417.9, "total_tokens": 900181312} | |
| {"current_steps": 2395, "total_steps": 3099, "loss": 0.0423, "lr": 7.4773241857444415e-06, "epoch": 2.3185283795231757, "percentage": 77.28, "elapsed_time": "2 days, 8:41:29", "remaining_time": "16:39:51", "throughput": 4419.96, "total_tokens": 902067280} | |
| {"current_steps": 2400, "total_steps": 3099, "loss": 0.0417, "lr": 7.3771746440190195e-06, "epoch": 2.323369236354835, "percentage": 77.44, "elapsed_time": "2 days, 8:46:30", "remaining_time": "16:32:08", "throughput": 4422.73, "total_tokens": 903961952} | |
| {"current_steps": 2405, "total_steps": 3099, "loss": 0.0439, "lr": 7.277584109124483e-06, "epoch": 2.328210093186494, "percentage": 77.61, "elapsed_time": "2 days, 8:51:28", "remaining_time": "16:24:26", "throughput": 4425.08, "total_tokens": 905764752} | |
| {"current_steps": 2410, "total_steps": 3099, "loss": 0.0437, "lr": 7.178555740133694e-06, "epoch": 2.333050950018153, "percentage": 77.77, "elapsed_time": "2 days, 8:56:46", "remaining_time": "16:16:49", "throughput": 4427.37, "total_tokens": 907639040} | |
| {"current_steps": 2415, "total_steps": 3099, "loss": 0.0429, "lr": 7.080092678287262e-06, "epoch": 2.3378918068498122, "percentage": 77.93, "elapsed_time": "2 days, 9:02:42", "remaining_time": "16:09:24", "throughput": 4428.99, "total_tokens": 909548736} | |
| {"current_steps": 2420, "total_steps": 3099, "loss": 0.0403, "lr": 6.982198046893912e-06, "epoch": 2.3427326636814714, "percentage": 78.09, "elapsed_time": "2 days, 9:06:40", "remaining_time": "16:01:27", "throughput": 4432.72, "total_tokens": 911369184} | |
| {"current_steps": 2425, "total_steps": 3099, "loss": 0.0444, "lr": 6.884874951231407e-06, "epoch": 2.347573520513131, "percentage": 78.25, "elapsed_time": "2 days, 9:11:35", "remaining_time": "15:53:46", "throughput": 4435.43, "total_tokens": 913234896} | |
| {"current_steps": 2430, "total_steps": 3099, "loss": 0.045, "lr": 6.788126478448046e-06, "epoch": 2.35241437734479, "percentage": 78.41, "elapsed_time": "2 days, 9:17:25", "remaining_time": "15:46:21", "throughput": 4437.19, "total_tokens": 915148176} | |
| {"current_steps": 2435, "total_steps": 3099, "loss": 0.0438, "lr": 6.691955697464722e-06, "epoch": 2.357255234176449, "percentage": 78.57, "elapsed_time": "2 days, 9:24:05", "remaining_time": "15:39:10", "throughput": 4438.01, "total_tokens": 917092976} | |
| {"current_steps": 2440, "total_steps": 3099, "loss": 0.0424, "lr": 6.596365658877612e-06, "epoch": 2.3620960910081084, "percentage": 78.74, "elapsed_time": "2 days, 9:30:17", "remaining_time": "15:31:51", "throughput": 4439.57, "total_tokens": 919066720} | |
| {"current_steps": 2445, "total_steps": 3099, "loss": 0.0417, "lr": 6.501359394861378e-06, "epoch": 2.3669369478397675, "percentage": 78.9, "elapsed_time": "2 days, 9:34:44", "remaining_time": "15:24:05", "throughput": 4442.51, "total_tokens": 920862256} | |
| {"current_steps": 2450, "total_steps": 3099, "loss": 0.045, "lr": 6.4069399190729965e-06, "epoch": 2.371777804671427, "percentage": 79.06, "elapsed_time": "2 days, 9:38:47", "remaining_time": "15:16:13", "throughput": 4445.83, "total_tokens": 922629344} | |
| {"current_steps": 2455, "total_steps": 3099, "loss": 0.0428, "lr": 6.3131102265561595e-06, "epoch": 2.376618661503086, "percentage": 79.22, "elapsed_time": "2 days, 9:43:30", "remaining_time": "15:08:33", "throughput": 4448.57, "total_tokens": 924459968} | |
| {"current_steps": 2460, "total_steps": 3099, "loss": 0.0434, "lr": 6.219873293646275e-06, "epoch": 2.3814595183347453, "percentage": 79.38, "elapsed_time": "2 days, 9:48:17", "remaining_time": "15:00:54", "throughput": 4451.19, "total_tokens": 926282784} | |
| {"current_steps": 2465, "total_steps": 3099, "loss": 0.0423, "lr": 6.127232077876044e-06, "epoch": 2.3863003751664045, "percentage": 79.54, "elapsed_time": "2 days, 9:53:15", "remaining_time": "14:53:19", "throughput": 4453.57, "total_tokens": 928104928} | |
| {"current_steps": 2470, "total_steps": 3099, "loss": 0.0414, "lr": 6.0351895178816675e-06, "epoch": 2.3911412319980636, "percentage": 79.7, "elapsed_time": "2 days, 9:59:12", "remaining_time": "14:46:00", "throughput": 4455.2, "total_tokens": 930034976} | |
| {"current_steps": 2475, "total_steps": 3099, "loss": 0.0403, "lr": 5.943748533309609e-06, "epoch": 2.3959820888297227, "percentage": 79.86, "elapsed_time": "2 days, 10:03:49", "remaining_time": "14:38:20", "throughput": 4458.07, "total_tokens": 931869680} | |
| {"current_steps": 2480, "total_steps": 3099, "loss": 0.0426, "lr": 5.8529120247239945e-06, "epoch": 2.400822945661382, "percentage": 80.03, "elapsed_time": "2 days, 10:10:10", "remaining_time": "14:31:08", "throughput": 4459.29, "total_tokens": 933822272} | |
| {"current_steps": 2485, "total_steps": 3099, "loss": 0.041, "lr": 5.762682873514605e-06, "epoch": 2.4056638024930415, "percentage": 80.19, "elapsed_time": "2 days, 10:14:40", "remaining_time": "14:23:28", "throughput": 4462.39, "total_tokens": 935677664} | |
| {"current_steps": 2490, "total_steps": 3099, "loss": 0.0445, "lr": 5.673063941805451e-06, "epoch": 2.4105046593247006, "percentage": 80.35, "elapsed_time": "2 days, 10:19:56", "remaining_time": "14:16:00", "throughput": 4464.63, "total_tokens": 937557696} | |
| {"current_steps": 2495, "total_steps": 3099, "loss": 0.0403, "lr": 5.584058072364032e-06, "epoch": 2.4153455161563597, "percentage": 80.51, "elapsed_time": "2 days, 10:24:15", "remaining_time": "14:08:19", "throughput": 4468.13, "total_tokens": 939447456} | |
| {"current_steps": 2500, "total_steps": 3099, "loss": 0.0413, "lr": 5.495668088511128e-06, "epoch": 2.420186372988019, "percentage": 80.67, "elapsed_time": "2 days, 10:30:34", "remaining_time": "14:01:08", "throughput": 4469.23, "total_tokens": 941372928} | |
| {"current_steps": 2505, "total_steps": 3099, "loss": 0.0435, "lr": 5.407896794031245e-06, "epoch": 2.425027229819678, "percentage": 80.83, "elapsed_time": "2 days, 10:35:47", "remaining_time": "13:53:41", "throughput": 4471.36, "total_tokens": 943222032} | |
| {"current_steps": 2510, "total_steps": 3099, "loss": 0.0424, "lr": 5.3207469730836875e-06, "epoch": 2.429868086651337, "percentage": 80.99, "elapsed_time": "2 days, 10:41:27", "remaining_time": "13:46:21", "throughput": 4473.24, "total_tokens": 945141472} | |
| {"current_steps": 2515, "total_steps": 3099, "loss": 0.042, "lr": 5.2342213901142415e-06, "epoch": 2.4347089434829963, "percentage": 81.16, "elapsed_time": "2 days, 10:45:59", "remaining_time": "13:38:45", "throughput": 4476.02, "total_tokens": 946942384} | |
| {"current_steps": 2520, "total_steps": 3099, "loss": 0.0424, "lr": 5.1483227897674736e-06, "epoch": 2.439549800314656, "percentage": 81.32, "elapsed_time": "2 days, 10:50:58", "remaining_time": "13:31:16", "throughput": 4478.45, "total_tokens": 948797600} | |
| {"current_steps": 2525, "total_steps": 3099, "loss": 0.044, "lr": 5.0630538967996824e-06, "epoch": 2.444390657146315, "percentage": 81.48, "elapsed_time": "2 days, 10:57:19", "remaining_time": "13:24:07", "throughput": 4479.56, "total_tokens": 950738128} | |
| {"current_steps": 2530, "total_steps": 3099, "loss": 0.0414, "lr": 4.978417415992459e-06, "epoch": 2.449231513977974, "percentage": 81.64, "elapsed_time": "2 days, 11:02:39", "remaining_time": "13:16:44", "throughput": 4481.95, "total_tokens": 952683104} | |
| {"current_steps": 2535, "total_steps": 3099, "loss": 0.044, "lr": 4.8944160320668925e-06, "epoch": 2.4540723708096333, "percentage": 81.8, "elapsed_time": "2 days, 11:07:43", "remaining_time": "13:09:19", "throughput": 4484.4, "total_tokens": 954565248} | |
| {"current_steps": 2540, "total_steps": 3099, "loss": 0.0435, "lr": 4.811052409598415e-06, "epoch": 2.4589132276412924, "percentage": 81.96, "elapsed_time": "2 days, 11:13:25", "remaining_time": "13:02:01", "throughput": 4486.09, "total_tokens": 956458752} | |
| {"current_steps": 2545, "total_steps": 3099, "loss": 0.0434, "lr": 4.728329192932277e-06, "epoch": 2.4637540844729515, "percentage": 82.12, "elapsed_time": "2 days, 11:19:00", "remaining_time": "12:54:43", "throughput": 4487.95, "total_tokens": 958360512} | |
| {"current_steps": 2550, "total_steps": 3099, "loss": 0.0433, "lr": 4.64624900609964e-06, "epoch": 2.468594941304611, "percentage": 82.28, "elapsed_time": "2 days, 11:23:46", "remaining_time": "12:47:15", "throughput": 4490.74, "total_tokens": 960237872} | |
| {"current_steps": 2555, "total_steps": 3099, "loss": 0.0413, "lr": 4.56481445273439e-06, "epoch": 2.4734357981362702, "percentage": 82.45, "elapsed_time": "2 days, 11:30:14", "remaining_time": "12:40:09", "throughput": 4491.97, "total_tokens": 962247008} | |
| {"current_steps": 2560, "total_steps": 3099, "loss": 0.0414, "lr": 4.4840281159905155e-06, "epoch": 2.4782766549679294, "percentage": 82.61, "elapsed_time": "2 days, 11:35:49", "remaining_time": "12:32:52", "throughput": 4493.93, "total_tokens": 964170272} | |
| {"current_steps": 2565, "total_steps": 3099, "loss": 0.0412, "lr": 4.403892558460177e-06, "epoch": 2.4831175117995885, "percentage": 82.77, "elapsed_time": "2 days, 11:42:08", "remaining_time": "12:25:45", "throughput": 4495.07, "total_tokens": 966120000} | |
| {"current_steps": 2570, "total_steps": 3099, "loss": 0.0412, "lr": 4.324410322092415e-06, "epoch": 2.4879583686312476, "percentage": 82.93, "elapsed_time": "2 days, 11:46:51", "remaining_time": "12:18:18", "throughput": 4497.72, "total_tokens": 967960784} | |
| {"current_steps": 2575, "total_steps": 3099, "loss": 0.0417, "lr": 4.2455839281125256e-06, "epoch": 2.4927992254629068, "percentage": 83.09, "elapsed_time": "2 days, 11:51:54", "remaining_time": "12:10:56", "throughput": 4500.14, "total_tokens": 969844080} | |
| {"current_steps": 2580, "total_steps": 3099, "loss": 0.0417, "lr": 4.167415876942085e-06, "epoch": 2.4976400822945664, "percentage": 83.25, "elapsed_time": "2 days, 11:56:57", "remaining_time": "12:03:34", "throughput": 4502.38, "total_tokens": 971694160} | |
| {"current_steps": 2585, "total_steps": 3099, "loss": 0.0425, "lr": 4.089908648119625e-06, "epoch": 2.5024809391262255, "percentage": 83.41, "elapsed_time": "2 days, 12:01:48", "remaining_time": "11:56:10", "throughput": 4504.9, "total_tokens": 973545824} | |
| {"current_steps": 2590, "total_steps": 3099, "loss": 0.0411, "lr": 4.013064700221991e-06, "epoch": 2.5073217959578846, "percentage": 83.58, "elapsed_time": "2 days, 12:07:28", "remaining_time": "11:48:57", "throughput": 4506.65, "total_tokens": 975457776} | |
| {"current_steps": 2595, "total_steps": 3099, "loss": 0.0405, "lr": 3.936886470786347e-06, "epoch": 2.5121626527895438, "percentage": 83.74, "elapsed_time": "2 days, 12:12:49", "remaining_time": "11:41:40", "throughput": 4508.77, "total_tokens": 977366416} | |
| {"current_steps": 2600, "total_steps": 3099, "loss": 0.0432, "lr": 3.8613763762328695e-06, "epoch": 2.517003509621203, "percentage": 83.9, "elapsed_time": "2 days, 12:17:52", "remaining_time": "11:34:21", "throughput": 4511.22, "total_tokens": 979260288} | |
| {"current_steps": 2605, "total_steps": 3099, "loss": 0.0441, "lr": 3.7865368117880688e-06, "epoch": 2.521844366452862, "percentage": 84.06, "elapsed_time": "2 days, 12:23:16", "remaining_time": "11:27:06", "throughput": 4513.24, "total_tokens": 981164192} | |
| {"current_steps": 2610, "total_steps": 3099, "loss": 0.041, "lr": 3.712370151408842e-06, "epoch": 2.526685223284521, "percentage": 84.22, "elapsed_time": "2 days, 12:28:21", "remaining_time": "11:19:47", "throughput": 4515.46, "total_tokens": 983019680} | |
| {"current_steps": 2615, "total_steps": 3099, "loss": 0.0382, "lr": 3.6388787477071557e-06, "epoch": 2.5315260801161807, "percentage": 84.38, "elapsed_time": "2 days, 12:33:58", "remaining_time": "11:12:35", "throughput": 4517.31, "total_tokens": 984946480} | |
| {"current_steps": 2620, "total_steps": 3099, "loss": 0.0431, "lr": 3.5660649318754153e-06, "epoch": 2.53636693694784, "percentage": 84.54, "elapsed_time": "2 days, 12:39:23", "remaining_time": "11:05:22", "throughput": 4519.17, "total_tokens": 986820704} | |
| {"current_steps": 2625, "total_steps": 3099, "loss": 0.0404, "lr": 3.493931013612528e-06, "epoch": 2.541207793779499, "percentage": 84.7, "elapsed_time": "2 days, 12:44:21", "remaining_time": "10:58:04", "throughput": 4521.53, "total_tokens": 988683712} | |
| {"current_steps": 2630, "total_steps": 3099, "loss": 0.0412, "lr": 3.4224792810506335e-06, "epoch": 2.546048650611158, "percentage": 84.87, "elapsed_time": "2 days, 12:50:31", "remaining_time": "10:50:59", "throughput": 4522.71, "total_tokens": 990613776} | |
| {"current_steps": 2635, "total_steps": 3099, "loss": 0.0421, "lr": 3.3517120006825137e-06, "epoch": 2.5508895074428173, "percentage": 85.03, "elapsed_time": "2 days, 12:56:07", "remaining_time": "10:43:48", "throughput": 4524.44, "total_tokens": 992516752} | |
| {"current_steps": 2640, "total_steps": 3099, "loss": 0.0433, "lr": 3.2816314172897183e-06, "epoch": 2.5557303642744764, "percentage": 85.19, "elapsed_time": "2 days, 13:01:24", "remaining_time": "10:36:35", "throughput": 4526.4, "total_tokens": 994379968} | |
| {"current_steps": 2645, "total_steps": 3099, "loss": 0.0413, "lr": 3.2122397538713432e-06, "epoch": 2.5605712211061356, "percentage": 85.35, "elapsed_time": "2 days, 13:08:32", "remaining_time": "10:29:41", "throughput": 4526.66, "total_tokens": 996372960} | |
| {"current_steps": 2650, "total_steps": 3099, "loss": 0.0445, "lr": 3.143539211573518e-06, "epoch": 2.565412077937795, "percentage": 85.51, "elapsed_time": "2 days, 13:12:48", "remaining_time": "10:22:17", "throughput": 4529.44, "total_tokens": 998147504} | |
| {"current_steps": 2655, "total_steps": 3099, "loss": 0.0402, "lr": 3.075531969619594e-06, "epoch": 2.5702529347694543, "percentage": 85.67, "elapsed_time": "2 days, 13:18:03", "remaining_time": "10:15:05", "throughput": 4531.43, "total_tokens": 1000010032} | |
| {"current_steps": 2660, "total_steps": 3099, "loss": 0.0394, "lr": 3.00822018524099e-06, "epoch": 2.5750937916011134, "percentage": 85.83, "elapsed_time": "2 days, 13:23:11", "remaining_time": "10:07:51", "throughput": 4533.71, "total_tokens": 1001911504} | |
| {"current_steps": 2665, "total_steps": 3099, "loss": 0.0405, "lr": 2.9416059936088176e-06, "epoch": 2.5799346484327725, "percentage": 86.0, "elapsed_time": "2 days, 13:29:29", "remaining_time": "10:00:50", "throughput": 4535.02, "total_tokens": 1003915536} | |
| {"current_steps": 2670, "total_steps": 3099, "loss": 0.042, "lr": 2.8756915077660816e-06, "epoch": 2.5847755052644317, "percentage": 86.16, "elapsed_time": "2 days, 13:34:39", "remaining_time": "9:53:38", "throughput": 4537.12, "total_tokens": 1005786320} | |
| {"current_steps": 2675, "total_steps": 3099, "loss": 0.046, "lr": 2.810478818560719e-06, "epoch": 2.5896163620960913, "percentage": 86.32, "elapsed_time": "2 days, 13:39:25", "remaining_time": "9:46:22", "throughput": 4539.3, "total_tokens": 1007566272} | |
| {"current_steps": 2680, "total_steps": 3099, "loss": 0.0429, "lr": 2.745969994579231e-06, "epoch": 2.59445721892775, "percentage": 86.48, "elapsed_time": "2 days, 13:44:53", "remaining_time": "9:39:14", "throughput": 4541.06, "total_tokens": 1009450528} | |
| {"current_steps": 2685, "total_steps": 3099, "loss": 0.0413, "lr": 2.6821670820810883e-06, "epoch": 2.5992980757594095, "percentage": 86.64, "elapsed_time": "2 days, 13:50:08", "remaining_time": "9:32:04", "throughput": 4542.95, "total_tokens": 1011300880} | |
| {"current_steps": 2690, "total_steps": 3099, "loss": 0.0406, "lr": 2.6190721049338145e-06, "epoch": 2.6041389325910687, "percentage": 86.8, "elapsed_time": "2 days, 13:54:47", "remaining_time": "9:24:48", "throughput": 4545.53, "total_tokens": 1013140688} | |
| {"current_steps": 2695, "total_steps": 3099, "loss": 0.0423, "lr": 2.5566870645487906e-06, "epoch": 2.608979789422728, "percentage": 86.96, "elapsed_time": "2 days, 14:00:08", "remaining_time": "9:17:40", "throughput": 4547.4, "total_tokens": 1015019296} | |
| {"current_steps": 2700, "total_steps": 3099, "loss": 0.0395, "lr": 2.495013939817767e-06, "epoch": 2.613820646254387, "percentage": 87.12, "elapsed_time": "2 days, 14:05:24", "remaining_time": "9:10:32", "throughput": 4549.35, "total_tokens": 1016892176} | |
| {"current_steps": 2705, "total_steps": 3099, "loss": 0.0405, "lr": 2.434054687050091e-06, "epoch": 2.618661503086046, "percentage": 87.29, "elapsed_time": "2 days, 14:10:26", "remaining_time": "9:03:21", "throughput": 4551.73, "total_tokens": 1018797600} | |
| {"current_steps": 2710, "total_steps": 3099, "loss": 0.0454, "lr": 2.3738112399106644e-06, "epoch": 2.6235023599177056, "percentage": 87.45, "elapsed_time": "2 days, 14:16:29", "remaining_time": "8:56:20", "throughput": 4552.93, "total_tokens": 1020718416} | |
| {"current_steps": 2715, "total_steps": 3099, "loss": 0.0428, "lr": 2.314285509358566e-06, "epoch": 2.6283432167493648, "percentage": 87.61, "elapsed_time": "2 days, 14:20:54", "remaining_time": "8:49:06", "throughput": 4555.6, "total_tokens": 1022524336} | |
| {"current_steps": 2720, "total_steps": 3099, "loss": 0.0406, "lr": 2.255479383586509e-06, "epoch": 2.633184073581024, "percentage": 87.77, "elapsed_time": "2 days, 14:25:43", "remaining_time": "8:41:55", "throughput": 4558.04, "total_tokens": 1024388192} | |
| {"current_steps": 2725, "total_steps": 3099, "loss": 0.0408, "lr": 2.197394727960861e-06, "epoch": 2.638024930412683, "percentage": 87.93, "elapsed_time": "2 days, 14:30:54", "remaining_time": "8:34:48", "throughput": 4559.87, "total_tokens": 1026219264} | |
| {"current_steps": 2730, "total_steps": 3099, "loss": 0.0392, "lr": 2.1400333849625338e-06, "epoch": 2.642865787244342, "percentage": 88.09, "elapsed_time": "2 days, 14:36:55", "remaining_time": "8:27:48", "throughput": 4561.63, "total_tokens": 1028260624} | |
| {"current_steps": 2735, "total_steps": 3099, "loss": 0.0415, "lr": 2.083397174128518e-06, "epoch": 2.6477066440760013, "percentage": 88.25, "elapsed_time": "2 days, 14:42:21", "remaining_time": "8:20:43", "throughput": 4563.45, "total_tokens": 1030159584} | |
| {"current_steps": 2740, "total_steps": 3099, "loss": 0.0432, "lr": 2.027487891994162e-06, "epoch": 2.6525475009076604, "percentage": 88.42, "elapsed_time": "2 days, 14:48:12", "remaining_time": "8:13:43", "throughput": 4564.88, "total_tokens": 1032081920} | |
| {"current_steps": 2745, "total_steps": 3099, "loss": 0.0425, "lr": 1.9723073120361924e-06, "epoch": 2.65738835773932, "percentage": 88.58, "elapsed_time": "2 days, 14:53:01", "remaining_time": "8:06:34", "throughput": 4567.21, "total_tokens": 1033931904} | |
| {"current_steps": 2750, "total_steps": 3099, "loss": 0.0397, "lr": 1.9178571846164532e-06, "epoch": 2.662229214570979, "percentage": 88.74, "elapsed_time": "2 days, 14:58:24", "remaining_time": "7:59:30", "throughput": 4568.98, "total_tokens": 1035806768} | |
| {"current_steps": 2755, "total_steps": 3099, "loss": 0.04, "lr": 1.8641392369263933e-06, "epoch": 2.6670700714026383, "percentage": 88.9, "elapsed_time": "2 days, 15:04:31", "remaining_time": "7:52:33", "throughput": 4570.28, "total_tokens": 1037779856} | |
| {"current_steps": 2760, "total_steps": 3099, "loss": 0.0439, "lr": 1.8111551729322662e-06, "epoch": 2.6719109282342974, "percentage": 89.06, "elapsed_time": "2 days, 15:09:56", "remaining_time": "7:45:30", "throughput": 4571.77, "total_tokens": 1039606192} | |
| {"current_steps": 2765, "total_steps": 3099, "loss": 0.0473, "lr": 1.7589066733210814e-06, "epoch": 2.6767517850659566, "percentage": 89.22, "elapsed_time": "2 days, 15:14:39", "remaining_time": "7:38:22", "throughput": 4573.76, "total_tokens": 1041352016} | |
| {"current_steps": 2770, "total_steps": 3099, "loss": 0.0432, "lr": 1.7073953954472949e-06, "epoch": 2.681592641897616, "percentage": 89.38, "elapsed_time": "2 days, 15:20:04", "remaining_time": "7:31:20", "throughput": 4575.4, "total_tokens": 1043209584} | |
| {"current_steps": 2775, "total_steps": 3099, "loss": 0.0423, "lr": 1.6566229732802501e-06, "epoch": 2.686433498729275, "percentage": 89.55, "elapsed_time": "2 days, 15:25:27", "remaining_time": "7:24:18", "throughput": 4577.07, "total_tokens": 1045070400} | |
| {"current_steps": 2780, "total_steps": 3099, "loss": 0.0404, "lr": 1.6065910173523101e-06, "epoch": 2.6912743555609344, "percentage": 89.71, "elapsed_time": "2 days, 15:30:49", "remaining_time": "7:17:17", "throughput": 4579.19, "total_tokens": 1047027216} | |
| {"current_steps": 2785, "total_steps": 3099, "loss": 0.0407, "lr": 1.5573011147078236e-06, "epoch": 2.6961152123925936, "percentage": 89.87, "elapsed_time": "2 days, 15:36:07", "remaining_time": "7:10:15", "throughput": 4581.14, "total_tokens": 1048933616} | |
| {"current_steps": 2790, "total_steps": 3099, "loss": 0.0416, "lr": 1.5087548288527291e-06, "epoch": 2.7009560692242527, "percentage": 90.03, "elapsed_time": "2 days, 15:40:38", "remaining_time": "7:03:08", "throughput": 4583.58, "total_tokens": 1050730672} | |
| {"current_steps": 2795, "total_steps": 3099, "loss": 0.0415, "lr": 1.4609536997049977e-06, "epoch": 2.705796926055912, "percentage": 90.19, "elapsed_time": "2 days, 15:45:45", "remaining_time": "6:56:06", "throughput": 4585.62, "total_tokens": 1052607296} | |
| {"current_steps": 2800, "total_steps": 3099, "loss": 0.041, "lr": 1.4138992435457688e-06, "epoch": 2.710637782887571, "percentage": 90.35, "elapsed_time": "2 days, 15:51:14", "remaining_time": "6:49:07", "throughput": 4587.41, "total_tokens": 1054530832} | |
| {"current_steps": 2805, "total_steps": 3099, "loss": 0.0404, "lr": 1.3675929529712555e-06, "epoch": 2.7154786397192305, "percentage": 90.51, "elapsed_time": "2 days, 15:57:09", "remaining_time": "6:42:10", "throughput": 4588.95, "total_tokens": 1056509856} | |
| {"current_steps": 2810, "total_steps": 3099, "loss": 0.041, "lr": 1.3220362968454026e-06, "epoch": 2.7203194965508897, "percentage": 90.67, "elapsed_time": "2 days, 16:03:03", "remaining_time": "6:35:14", "throughput": 4590.05, "total_tokens": 1058388320} | |
| {"current_steps": 2815, "total_steps": 3099, "loss": 0.0416, "lr": 1.277230720253289e-06, "epoch": 2.725160353382549, "percentage": 90.84, "elapsed_time": "2 days, 16:07:42", "remaining_time": "6:28:11", "throughput": 4592.39, "total_tokens": 1060208912} | |
| {"current_steps": 2820, "total_steps": 3099, "loss": 0.042, "lr": 1.2331776444552939e-06, "epoch": 2.730001210214208, "percentage": 91.0, "elapsed_time": "2 days, 16:13:53", "remaining_time": "6:21:17", "throughput": 4593.53, "total_tokens": 1062178720} | |
| {"current_steps": 2825, "total_steps": 3099, "loss": 0.0409, "lr": 1.1898784668419927e-06, "epoch": 2.734842067045867, "percentage": 91.16, "elapsed_time": "2 days, 16:19:26", "remaining_time": "6:14:19", "throughput": 4595.3, "total_tokens": 1064115760} | |
| {"current_steps": 2830, "total_steps": 3099, "loss": 0.0433, "lr": 1.1473345608898789e-06, "epoch": 2.739682923877526, "percentage": 91.32, "elapsed_time": "2 days, 16:24:36", "remaining_time": "6:07:20", "throughput": 4597.14, "total_tokens": 1065971408} | |
| {"current_steps": 2835, "total_steps": 3099, "loss": 0.0433, "lr": 1.10554727611773e-06, "epoch": 2.7445237807091853, "percentage": 91.48, "elapsed_time": "2 days, 16:30:37", "remaining_time": "6:00:26", "throughput": 4598.27, "total_tokens": 1067891024} | |
| {"current_steps": 2840, "total_steps": 3099, "loss": 0.0433, "lr": 1.0645179380438657e-06, "epoch": 2.749364637540845, "percentage": 91.64, "elapsed_time": "2 days, 16:36:18", "remaining_time": "5:53:30", "throughput": 4599.49, "total_tokens": 1069744096} | |
| {"current_steps": 2845, "total_steps": 3099, "loss": 0.0395, "lr": 1.0242478481440498e-06, "epoch": 2.754205494372504, "percentage": 91.8, "elapsed_time": "2 days, 16:40:55", "remaining_time": "5:46:29", "throughput": 4601.99, "total_tokens": 1071601856} | |
| {"current_steps": 2850, "total_steps": 3099, "loss": 0.0421, "lr": 9.847382838102492e-07, "epoch": 2.759046351204163, "percentage": 91.97, "elapsed_time": "2 days, 16:46:06", "remaining_time": "5:39:31", "throughput": 4603.92, "total_tokens": 1073480480} | |
| {"current_steps": 2855, "total_steps": 3099, "loss": 0.0404, "lr": 9.459904983100704e-07, "epoch": 2.7638872080358223, "percentage": 92.13, "elapsed_time": "2 days, 16:51:13", "remaining_time": "5:32:33", "throughput": 4606.09, "total_tokens": 1075401632} | |
| {"current_steps": 2860, "total_steps": 3099, "loss": 0.0379, "lr": 9.080057207470405e-07, "epoch": 2.7687280648674815, "percentage": 92.29, "elapsed_time": "2 days, 16:56:46", "remaining_time": "5:25:38", "throughput": 4607.81, "total_tokens": 1077335872} | |
| {"current_steps": 2865, "total_steps": 3099, "loss": 0.0403, "lr": 8.707851560216112e-07, "epoch": 2.7735689216991406, "percentage": 92.45, "elapsed_time": "2 days, 17:02:44", "remaining_time": "5:18:45", "throughput": 4609.19, "total_tokens": 1079310576} | |
| {"current_steps": 2870, "total_steps": 3099, "loss": 0.0387, "lr": 8.343299847929226e-07, "epoch": 2.7784097785307997, "percentage": 92.61, "elapsed_time": "2 days, 17:08:03", "remaining_time": "5:11:49", "throughput": 4611.17, "total_tokens": 1081245280} | |
| {"current_steps": 2875, "total_steps": 3099, "loss": 0.0423, "lr": 7.986413634413686e-07, "epoch": 2.7832506353624593, "percentage": 92.77, "elapsed_time": "2 days, 17:14:28", "remaining_time": "5:04:59", "throughput": 4611.85, "total_tokens": 1083177952} | |
| {"current_steps": 2880, "total_steps": 3099, "loss": 0.0415, "lr": 7.637204240319163e-07, "epoch": 2.7880914921941184, "percentage": 92.93, "elapsed_time": "2 days, 17:19:57", "remaining_time": "4:58:04", "throughput": 4613.46, "total_tokens": 1085074640} | |
| {"current_steps": 2885, "total_steps": 3099, "loss": 0.04, "lr": 7.295682742781862e-07, "epoch": 2.7929323490257776, "percentage": 93.09, "elapsed_time": "2 days, 17:24:44", "remaining_time": "4:51:07", "throughput": 4615.6, "total_tokens": 1086903600} | |
| {"current_steps": 2890, "total_steps": 3099, "loss": 0.0407, "lr": 6.961859975073121e-07, "epoch": 2.7977732058574367, "percentage": 93.26, "elapsed_time": "2 days, 17:29:01", "remaining_time": "4:44:08", "throughput": 4618.29, "total_tokens": 1088720960} | |
| {"current_steps": 2895, "total_steps": 3099, "loss": 0.0399, "lr": 6.635746526255981e-07, "epoch": 2.802614062689096, "percentage": 93.42, "elapsed_time": "2 days, 17:33:40", "remaining_time": "4:37:11", "throughput": 4620.54, "total_tokens": 1090542208} | |
| {"current_steps": 2900, "total_steps": 3099, "loss": 0.0407, "lr": 6.317352740849048e-07, "epoch": 2.8074549195207554, "percentage": 93.58, "elapsed_time": "2 days, 17:39:07", "remaining_time": "4:30:18", "throughput": 4622.18, "total_tokens": 1092439568} | |
| {"current_steps": 2905, "total_steps": 3099, "loss": 0.0425, "lr": 6.006688718498549e-07, "epoch": 2.812295776352414, "percentage": 93.74, "elapsed_time": "2 days, 17:43:59", "remaining_time": "4:23:23", "throughput": 4624.11, "total_tokens": 1094246688} | |
| {"current_steps": 2910, "total_steps": 3099, "loss": 0.0426, "lr": 5.703764313657795e-07, "epoch": 2.8171366331840737, "percentage": 93.9, "elapsed_time": "2 days, 17:49:28", "remaining_time": "4:16:30", "throughput": 4625.7, "total_tokens": 1096143712} | |
| {"current_steps": 2915, "total_steps": 3099, "loss": 0.0411, "lr": 5.408589135274755e-07, "epoch": 2.821977490015733, "percentage": 94.06, "elapsed_time": "2 days, 17:54:44", "remaining_time": "4:09:37", "throughput": 4627.82, "total_tokens": 1098111104} | |
| {"current_steps": 2920, "total_steps": 3099, "loss": 0.0407, "lr": 5.121172546487196e-07, "epoch": 2.826818346847392, "percentage": 94.22, "elapsed_time": "2 days, 18:00:50", "remaining_time": "4:02:48", "throughput": 4628.88, "total_tokens": 1100058224} | |
| {"current_steps": 2925, "total_steps": 3099, "loss": 0.0397, "lr": 4.841523664325581e-07, "epoch": 2.831659203679051, "percentage": 94.39, "elapsed_time": "2 days, 18:05:40", "remaining_time": "3:55:54", "throughput": 4630.99, "total_tokens": 1101896720} | |
| {"current_steps": 2930, "total_steps": 3099, "loss": 0.0412, "lr": 4.5696513594240264e-07, "epoch": 2.8365000605107102, "percentage": 94.55, "elapsed_time": "2 days, 18:10:11", "remaining_time": "3:48:59", "throughput": 4633.46, "total_tokens": 1103744592} | |
| {"current_steps": 2935, "total_steps": 3099, "loss": 0.0407, "lr": 4.305564255738831e-07, "epoch": 2.84134091734237, "percentage": 94.71, "elapsed_time": "2 days, 18:15:30", "remaining_time": "3:42:08", "throughput": 4635.25, "total_tokens": 1105651136} | |
| {"current_steps": 2940, "total_steps": 3099, "loss": 0.0412, "lr": 4.0492707302749176e-07, "epoch": 2.846181774174029, "percentage": 94.87, "elapsed_time": "2 days, 18:20:07", "remaining_time": "3:35:15", "throughput": 4637.5, "total_tokens": 1107467904} | |
| {"current_steps": 2945, "total_steps": 3099, "loss": 0.041, "lr": 3.800778912820102e-07, "epoch": 2.851022631005688, "percentage": 95.03, "elapsed_time": "2 days, 18:25:01", "remaining_time": "3:28:23", "throughput": 4639.37, "total_tokens": 1109281136} | |
| {"current_steps": 2950, "total_steps": 3099, "loss": 0.041, "lr": 3.560096685687325e-07, "epoch": 2.8558634878373472, "percentage": 95.19, "elapsed_time": "2 days, 18:30:24", "remaining_time": "3:21:32", "throughput": 4640.99, "total_tokens": 1111166496} | |
| {"current_steps": 2955, "total_steps": 3099, "loss": 0.0408, "lr": 3.32723168346441e-07, "epoch": 2.8607043446690064, "percentage": 95.35, "elapsed_time": "2 days, 18:35:36", "remaining_time": "3:14:42", "throughput": 4642.71, "total_tokens": 1113024464} | |
| {"current_steps": 2960, "total_steps": 3099, "loss": 0.0428, "lr": 3.102191292772144e-07, "epoch": 2.8655452015006655, "percentage": 95.51, "elapsed_time": "2 days, 18:39:49", "remaining_time": "3:07:49", "throughput": 4645.15, "total_tokens": 1114789808} | |
| {"current_steps": 2965, "total_steps": 3099, "loss": 0.0414, "lr": 2.884982652029716e-07, "epoch": 2.8703860583323246, "percentage": 95.68, "elapsed_time": "2 days, 18:45:05", "remaining_time": "3:01:00", "throughput": 4647.06, "total_tokens": 1116715504} | |
| {"current_steps": 2970, "total_steps": 3099, "loss": 0.0423, "lr": 2.6756126512285094e-07, "epoch": 2.875226915163984, "percentage": 95.84, "elapsed_time": "2 days, 18:50:57", "remaining_time": "2:54:12", "throughput": 4648.36, "total_tokens": 1118661392} | |
| {"current_steps": 2975, "total_steps": 3099, "loss": 0.043, "lr": 2.4740879317133314e-07, "epoch": 2.8800677719956433, "percentage": 96.0, "elapsed_time": "2 days, 18:56:30", "remaining_time": "2:47:24", "throughput": 4649.66, "total_tokens": 1120523488} | |
| {"current_steps": 2980, "total_steps": 3099, "loss": 0.0425, "lr": 2.2804148859719433e-07, "epoch": 2.8849086288273025, "percentage": 96.16, "elapsed_time": "2 days, 19:01:06", "remaining_time": "2:40:34", "throughput": 4651.83, "total_tokens": 1122329216} | |
| {"current_steps": 2985, "total_steps": 3099, "loss": 0.0423, "lr": 2.0945996574321392e-07, "epoch": 2.8897494856589616, "percentage": 96.32, "elapsed_time": "2 days, 19:05:11", "remaining_time": "2:33:43", "throughput": 4654.47, "total_tokens": 1124108576} | |
| {"current_steps": 2990, "total_steps": 3099, "loss": 0.0416, "lr": 1.9166481402669856e-07, "epoch": 2.8945903424906207, "percentage": 96.48, "elapsed_time": "2 days, 19:09:53", "remaining_time": "2:26:54", "throughput": 4656.62, "total_tokens": 1125941808} | |
| {"current_steps": 2995, "total_steps": 3099, "loss": 0.0412, "lr": 1.7465659792077484e-07, "epoch": 2.89943119932228, "percentage": 96.64, "elapsed_time": "2 days, 19:14:39", "remaining_time": "2:20:06", "throughput": 4658.6, "total_tokens": 1127752624} | |
| {"current_steps": 3000, "total_steps": 3099, "loss": 0.0418, "lr": 1.5843585693648967e-07, "epoch": 2.904272056153939, "percentage": 96.81, "elapsed_time": "2 days, 19:19:28", "remaining_time": "2:13:18", "throughput": 4660.68, "total_tokens": 1129601232} | |
| {"current_steps": 3005, "total_steps": 3099, "loss": 0.041, "lr": 1.4300310560570184e-07, "epoch": 2.9091129129855986, "percentage": 96.97, "elapsed_time": "2 days, 19:24:00", "remaining_time": "2:06:30", "throughput": 4663.05, "total_tokens": 1131446736} | |
| {"current_steps": 3010, "total_steps": 3099, "loss": 0.0402, "lr": 1.2835883346474786e-07, "epoch": 2.9139537698172577, "percentage": 97.13, "elapsed_time": "2 days, 19:29:26", "remaining_time": "1:59:44", "throughput": 4664.67, "total_tokens": 1133359440} | |
| {"current_steps": 3015, "total_steps": 3099, "loss": 0.0413, "lr": 1.1450350503892648e-07, "epoch": 2.918794626648917, "percentage": 97.29, "elapsed_time": "2 days, 19:33:53", "remaining_time": "1:52:56", "throughput": 4666.92, "total_tokens": 1135150272} | |
| {"current_steps": 3020, "total_steps": 3099, "loss": 0.0397, "lr": 1.014375598277495e-07, "epoch": 2.923635483480576, "percentage": 97.45, "elapsed_time": "2 days, 19:39:13", "remaining_time": "1:46:11", "throughput": 4668.62, "total_tokens": 1137058240} | |
| {"current_steps": 3025, "total_steps": 3099, "loss": 0.0423, "lr": 8.916141229101671e-08, "epoch": 2.928476340312235, "percentage": 97.61, "elapsed_time": "2 days, 19:43:52", "remaining_time": "1:39:24", "throughput": 4670.75, "total_tokens": 1138880976} | |
| {"current_steps": 3030, "total_steps": 3099, "loss": 0.0417, "lr": 7.767545183565983e-08, "epoch": 2.9333171971438947, "percentage": 97.77, "elapsed_time": "2 days, 19:49:44", "remaining_time": "1:32:40", "throughput": 4671.89, "total_tokens": 1140802272} | |
| {"current_steps": 3035, "total_steps": 3099, "loss": 0.0408, "lr": 6.69800428033912e-08, "epoch": 2.9381580539755534, "percentage": 97.93, "elapsed_time": "2 days, 19:55:33", "remaining_time": "1:25:56", "throughput": 4673.09, "total_tokens": 1142726336} | |
| {"current_steps": 3040, "total_steps": 3099, "loss": 0.041, "lr": 5.707552445914366e-08, "epoch": 2.942998910807213, "percentage": 98.1, "elapsed_time": "2 days, 20:01:01", "remaining_time": "1:19:12", "throughput": 4674.44, "total_tokens": 1144590976} | |
| {"current_steps": 3045, "total_steps": 3099, "loss": 0.0408, "lr": 4.7962210980317946e-08, "epoch": 2.947839767638872, "percentage": 98.26, "elapsed_time": "2 days, 20:06:28", "remaining_time": "1:12:28", "throughput": 4675.98, "total_tokens": 1146496640} | |
| {"current_steps": 3050, "total_steps": 3099, "loss": 0.0418, "lr": 3.964039144680465e-08, "epoch": 2.9526806244705313, "percentage": 98.42, "elapsed_time": "2 days, 20:11:21", "remaining_time": "1:05:43", "throughput": 4677.88, "total_tokens": 1148333472} | |
| {"current_steps": 3055, "total_steps": 3099, "loss": 0.0423, "lr": 3.2110329831824825e-08, "epoch": 2.9575214813021904, "percentage": 98.58, "elapsed_time": "2 days, 20:16:47", "remaining_time": "0:59:00", "throughput": 4679.53, "total_tokens": 1150262528} | |
| {"current_steps": 3060, "total_steps": 3099, "loss": 0.0384, "lr": 2.537226499355616e-08, "epoch": 2.9623623381338495, "percentage": 98.74, "elapsed_time": "2 days, 20:21:30", "remaining_time": "0:52:16", "throughput": 4681.66, "total_tokens": 1152112096} | |
| {"current_steps": 3065, "total_steps": 3099, "loss": 0.0419, "lr": 1.942641066754458e-08, "epoch": 2.967203194965509, "percentage": 98.9, "elapsed_time": "2 days, 20:26:46", "remaining_time": "0:45:33", "throughput": 4683.23, "total_tokens": 1153978224} | |
| {"current_steps": 3070, "total_steps": 3099, "loss": 0.0414, "lr": 1.4272955459937453e-08, "epoch": 2.9720440517971682, "percentage": 99.06, "elapsed_time": "2 days, 20:32:33", "remaining_time": "0:38:50", "throughput": 4684.38, "total_tokens": 1155885360} | |
| {"current_steps": 3075, "total_steps": 3099, "loss": 0.0387, "lr": 9.912062841496705e-09, "epoch": 2.9768849086288274, "percentage": 99.23, "elapsed_time": "2 days, 20:37:45", "remaining_time": "0:32:08", "throughput": 4686.02, "total_tokens": 1157755504} | |
| {"current_steps": 3080, "total_steps": 3099, "loss": 0.042, "lr": 6.343871142411306e-09, "epoch": 2.9817257654604865, "percentage": 99.39, "elapsed_time": "2 days, 20:42:39", "remaining_time": "0:25:25", "throughput": 4687.94, "total_tokens": 1159608192} | |
| {"current_steps": 3085, "total_steps": 3099, "loss": 0.0407, "lr": 3.568493547909113e-09, "epoch": 2.9865666222921456, "percentage": 99.55, "elapsed_time": "2 days, 20:48:34", "remaining_time": "0:18:44", "throughput": 4689.18, "total_tokens": 1161579776} | |
| {"current_steps": 3090, "total_steps": 3099, "loss": 0.0391, "lr": 1.586018094670849e-09, "epoch": 2.991407479123805, "percentage": 99.71, "elapsed_time": "2 days, 20:53:02", "remaining_time": "0:12:02", "throughput": 4691.49, "total_tokens": 1163408592} | |
| {"current_steps": 3095, "total_steps": 3099, "loss": 0.0417, "lr": 3.965076680351176e-10, "epoch": 2.996248335955464, "percentage": 99.87, "elapsed_time": "2 days, 20:58:17", "remaining_time": "0:05:20", "throughput": 4693.09, "total_tokens": 1165284400} | |
| {"current_steps": 3099, "total_steps": 3099, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "2 days, 21:03:34", "remaining_time": "0:00:00", "throughput": 4693.19, "total_tokens": 1166793552} | |