diff --git "a/trainer_log.jsonl" "b/trainer_log.jsonl" new file mode 100644--- /dev/null +++ "b/trainer_log.jsonl" @@ -0,0 +1,1348 @@ +{"current_steps": 5, "total_steps": 134280, "loss": 1.0438, "lr": 1.4894250819183796e-08, "epoch": 0.0007447125409591898, "percentage": 0.0, "elapsed_time": "0:00:01", "remaining_time": "12:03:13", "throughput": 1663.14, "total_tokens": 2688} +{"current_steps": 10, "total_steps": 134280, "loss": 1.4509, "lr": 3.351206434316354e-08, "epoch": 0.0014894250819183796, "percentage": 0.01, "elapsed_time": "0:00:02", "remaining_time": "10:34:15", "throughput": 2066.13, "total_tokens": 5856} +{"current_steps": 15, "total_steps": 134280, "loss": 1.1626, "lr": 5.2129877867143284e-08, "epoch": 0.002234137622877569, "percentage": 0.01, "elapsed_time": "0:00:03", "remaining_time": "9:48:30", "throughput": 2157.72, "total_tokens": 8512} +{"current_steps": 20, "total_steps": 134280, "loss": 1.1287, "lr": 7.074769139112303e-08, "epoch": 0.002978850163836759, "percentage": 0.01, "elapsed_time": "0:00:05", "remaining_time": "9:26:03", "throughput": 2213.72, "total_tokens": 11200} +{"current_steps": 25, "total_steps": 134280, "loss": 1.2403, "lr": 8.936550491510277e-08, "epoch": 0.0037235627047959487, "percentage": 0.02, "elapsed_time": "0:00:06", "remaining_time": "9:22:46", "throughput": 2279.98, "total_tokens": 14336} +{"current_steps": 30, "total_steps": 134280, "loss": 1.1193, "lr": 1.0798331843908253e-07, "epoch": 0.004468275245755138, "percentage": 0.02, "elapsed_time": "0:00:07", "remaining_time": "9:21:10", "throughput": 2330.6, "total_tokens": 17536} +{"current_steps": 35, "total_steps": 134280, "loss": 1.2912, "lr": 1.2660113196306226e-07, "epoch": 0.005212987786714328, "percentage": 0.03, "elapsed_time": "0:00:08", "remaining_time": "9:20:40", "throughput": 2360.62, "total_tokens": 20704} +{"current_steps": 40, "total_steps": 134280, "loss": 1.0157, "lr": 1.45218945487042e-07, "epoch": 0.005957700327673518, "percentage": 0.03, "elapsed_time": "0:00:09", "remaining_time": "9:13:08", "throughput": 2381.55, "total_tokens": 23552} +{"current_steps": 45, "total_steps": 134280, "loss": 1.0662, "lr": 1.6383675901102174e-07, "epoch": 0.006702412868632708, "percentage": 0.03, "elapsed_time": "0:00:11", "remaining_time": "9:09:56", "throughput": 2398.2, "total_tokens": 26528} +{"current_steps": 50, "total_steps": 134280, "loss": 1.461, "lr": 1.824545725350015e-07, "epoch": 0.0074471254095918975, "percentage": 0.04, "elapsed_time": "0:00:12", "remaining_time": "9:03:05", "throughput": 2401.72, "total_tokens": 29152} +{"current_steps": 55, "total_steps": 134280, "loss": 1.3834, "lr": 2.0107238605898125e-07, "epoch": 0.008191837950551088, "percentage": 0.04, "elapsed_time": "0:00:13", "remaining_time": "8:58:32", "throughput": 2407.18, "total_tokens": 31872} +{"current_steps": 60, "total_steps": 134280, "loss": 1.0165, "lr": 2.1969019958296101e-07, "epoch": 0.008936550491510277, "percentage": 0.04, "elapsed_time": "0:00:14", "remaining_time": "8:57:01", "throughput": 2414.87, "total_tokens": 34784} +{"current_steps": 65, "total_steps": 134280, "loss": 1.2152, "lr": 2.3830801310694073e-07, "epoch": 0.009681263032469467, "percentage": 0.05, "elapsed_time": "0:00:15", "remaining_time": "8:55:04", "throughput": 2422.39, "total_tokens": 37664} +{"current_steps": 70, "total_steps": 134280, "loss": 1.7297, "lr": 2.569258266309205e-07, "epoch": 0.010425975573428656, "percentage": 0.05, "elapsed_time": "0:00:16", "remaining_time": "8:53:21", "throughput": 2427.2, "total_tokens": 40512} +{"current_steps": 75, "total_steps": 134280, "loss": 1.3359, "lr": 2.755436401549002e-07, "epoch": 0.011170688114387846, "percentage": 0.06, "elapsed_time": "0:00:17", "remaining_time": "8:52:30", "throughput": 2431.96, "total_tokens": 43424} +{"current_steps": 80, "total_steps": 134280, "loss": 1.1618, "lr": 2.9416145367888e-07, "epoch": 0.011915400655347037, "percentage": 0.06, "elapsed_time": "0:00:18", "remaining_time": "8:50:55", "throughput": 2433.32, "total_tokens": 46208} +{"current_steps": 85, "total_steps": 134280, "loss": 1.1754, "lr": 3.1277926720285975e-07, "epoch": 0.012660113196306225, "percentage": 0.06, "elapsed_time": "0:00:20", "remaining_time": "8:47:35", "throughput": 2435.4, "total_tokens": 48832} +{"current_steps": 90, "total_steps": 134280, "loss": 1.0431, "lr": 3.3139708072683946e-07, "epoch": 0.013404825737265416, "percentage": 0.07, "elapsed_time": "0:00:21", "remaining_time": "8:45:46", "throughput": 2438.05, "total_tokens": 51584} +{"current_steps": 95, "total_steps": 134280, "loss": 1.0679, "lr": 3.5001489425081923e-07, "epoch": 0.014149538278224605, "percentage": 0.07, "elapsed_time": "0:00:22", "remaining_time": "8:44:13", "throughput": 2441.49, "total_tokens": 54368} +{"current_steps": 100, "total_steps": 134280, "loss": 1.0747, "lr": 3.6863270777479894e-07, "epoch": 0.014894250819183795, "percentage": 0.07, "elapsed_time": "0:00:23", "remaining_time": "8:43:56", "throughput": 2443.49, "total_tokens": 57248} +{"current_steps": 105, "total_steps": 134280, "loss": 1.3667, "lr": 3.872505212987787e-07, "epoch": 0.015638963360142984, "percentage": 0.08, "elapsed_time": "0:00:24", "remaining_time": "8:45:04", "throughput": 2447.92, "total_tokens": 60352} +{"current_steps": 110, "total_steps": 134280, "loss": 1.2789, "lr": 4.058683348227585e-07, "epoch": 0.016383675901102176, "percentage": 0.08, "elapsed_time": "0:00:25", "remaining_time": "8:43:42", "throughput": 2448.29, "total_tokens": 63072} +{"current_steps": 115, "total_steps": 134280, "loss": 1.4066, "lr": 4.244861483467382e-07, "epoch": 0.017128388442061365, "percentage": 0.09, "elapsed_time": "0:00:26", "remaining_time": "8:42:43", "throughput": 2453.29, "total_tokens": 65952} +{"current_steps": 120, "total_steps": 134280, "loss": 0.9153, "lr": 4.431039618707179e-07, "epoch": 0.017873100983020553, "percentage": 0.09, "elapsed_time": "0:00:27", "remaining_time": "8:41:30", "throughput": 2453.65, "total_tokens": 68672} +{"current_steps": 125, "total_steps": 134280, "loss": 1.2409, "lr": 4.617217753946977e-07, "epoch": 0.018617813523979745, "percentage": 0.09, "elapsed_time": "0:00:29", "remaining_time": "8:40:49", "throughput": 2455.16, "total_tokens": 71488} +{"current_steps": 130, "total_steps": 134280, "loss": 1.1523, "lr": 4.803395889186774e-07, "epoch": 0.019362526064938934, "percentage": 0.1, "elapsed_time": "0:00:30", "remaining_time": "8:40:15", "throughput": 2456.38, "total_tokens": 74304} +{"current_steps": 135, "total_steps": 134280, "loss": 1.3362, "lr": 4.989574024426572e-07, "epoch": 0.020107238605898123, "percentage": 0.1, "elapsed_time": "0:00:31", "remaining_time": "8:39:40", "throughput": 2457.68, "total_tokens": 77120} +{"current_steps": 140, "total_steps": 134280, "loss": 1.0845, "lr": 5.17575215966637e-07, "epoch": 0.02085195114685731, "percentage": 0.1, "elapsed_time": "0:00:32", "remaining_time": "8:39:38", "throughput": 2458.45, "total_tokens": 80000} +{"current_steps": 145, "total_steps": 134280, "loss": 1.3448, "lr": 5.361930294906167e-07, "epoch": 0.021596663687816504, "percentage": 0.11, "elapsed_time": "0:00:33", "remaining_time": "8:39:39", "throughput": 2459.93, "total_tokens": 82912} +{"current_steps": 150, "total_steps": 134280, "loss": 1.1236, "lr": 5.548108430145964e-07, "epoch": 0.022341376228775692, "percentage": 0.11, "elapsed_time": "0:00:34", "remaining_time": "8:39:47", "throughput": 2460.69, "total_tokens": 85824} +{"current_steps": 155, "total_steps": 134280, "loss": 1.3071, "lr": 5.734286565385761e-07, "epoch": 0.02308608876973488, "percentage": 0.12, "elapsed_time": "0:00:36", "remaining_time": "8:39:25", "throughput": 2461.09, "total_tokens": 88640} +{"current_steps": 160, "total_steps": 134280, "loss": 1.2794, "lr": 5.920464700625559e-07, "epoch": 0.023830801310694073, "percentage": 0.12, "elapsed_time": "0:00:37", "remaining_time": "8:39:29", "throughput": 2462.98, "total_tokens": 91584} +{"current_steps": 165, "total_steps": 134280, "loss": 1.3167, "lr": 6.106642835865357e-07, "epoch": 0.024575513851653262, "percentage": 0.12, "elapsed_time": "0:00:38", "remaining_time": "8:39:38", "throughput": 2466.01, "total_tokens": 94592} +{"current_steps": 170, "total_steps": 134280, "loss": 1.342, "lr": 6.292820971105154e-07, "epoch": 0.02532022639261245, "percentage": 0.13, "elapsed_time": "0:00:39", "remaining_time": "8:40:20", "throughput": 2470.23, "total_tokens": 97760} +{"current_steps": 175, "total_steps": 134280, "loss": 1.2563, "lr": 6.478999106344952e-07, "epoch": 0.026064938933571643, "percentage": 0.13, "elapsed_time": "0:00:40", "remaining_time": "8:41:43", "throughput": 2471.55, "total_tokens": 100960} +{"current_steps": 180, "total_steps": 134280, "loss": 0.9274, "lr": 6.665177241584749e-07, "epoch": 0.02680965147453083, "percentage": 0.13, "elapsed_time": "0:00:42", "remaining_time": "8:43:21", "throughput": 2474.99, "total_tokens": 104320} +{"current_steps": 185, "total_steps": 134280, "loss": 0.9063, "lr": 6.851355376824546e-07, "epoch": 0.02755436401549002, "percentage": 0.14, "elapsed_time": "0:00:43", "remaining_time": "8:42:26", "throughput": 2474.35, "total_tokens": 107008} +{"current_steps": 190, "total_steps": 134280, "loss": 1.1456, "lr": 7.037533512064343e-07, "epoch": 0.02829907655644921, "percentage": 0.14, "elapsed_time": "0:00:44", "remaining_time": "8:42:32", "throughput": 2477.18, "total_tokens": 110048} +{"current_steps": 195, "total_steps": 134280, "loss": 0.9727, "lr": 7.223711647304142e-07, "epoch": 0.0290437890974084, "percentage": 0.15, "elapsed_time": "0:00:45", "remaining_time": "8:42:21", "throughput": 2476.9, "total_tokens": 112896} +{"current_steps": 200, "total_steps": 134280, "loss": 0.9092, "lr": 7.409889782543939e-07, "epoch": 0.02978850163836759, "percentage": 0.15, "elapsed_time": "0:00:46", "remaining_time": "8:43:43", "throughput": 2478.85, "total_tokens": 116192} +{"current_steps": 205, "total_steps": 134280, "loss": 1.1284, "lr": 7.596067917783736e-07, "epoch": 0.03053321417932678, "percentage": 0.15, "elapsed_time": "0:00:48", "remaining_time": "8:43:38", "throughput": 2481.32, "total_tokens": 119200} +{"current_steps": 210, "total_steps": 134280, "loss": 1.1307, "lr": 7.782246053023533e-07, "epoch": 0.03127792672028597, "percentage": 0.16, "elapsed_time": "0:00:49", "remaining_time": "8:43:43", "throughput": 2481.58, "total_tokens": 122144} +{"current_steps": 215, "total_steps": 134280, "loss": 1.3167, "lr": 7.96842418826333e-07, "epoch": 0.032022639261245156, "percentage": 0.16, "elapsed_time": "0:00:50", "remaining_time": "8:44:33", "throughput": 2482.66, "total_tokens": 125312} +{"current_steps": 220, "total_steps": 134280, "loss": 1.1237, "lr": 8.154602323503128e-07, "epoch": 0.03276735180220435, "percentage": 0.16, "elapsed_time": "0:00:51", "remaining_time": "8:44:07", "throughput": 2483.4, "total_tokens": 128160} +{"current_steps": 225, "total_steps": 134280, "loss": 1.1886, "lr": 8.340780458742925e-07, "epoch": 0.03351206434316354, "percentage": 0.17, "elapsed_time": "0:00:52", "remaining_time": "8:44:14", "throughput": 2484.5, "total_tokens": 131168} +{"current_steps": 230, "total_steps": 134280, "loss": 0.9799, "lr": 8.526958593982724e-07, "epoch": 0.03425677688412273, "percentage": 0.17, "elapsed_time": "0:00:53", "remaining_time": "8:43:31", "throughput": 2484.2, "total_tokens": 133888} +{"current_steps": 235, "total_steps": 134280, "loss": 0.8781, "lr": 8.713136729222521e-07, "epoch": 0.03500148942508192, "percentage": 0.18, "elapsed_time": "0:00:54", "remaining_time": "8:42:50", "throughput": 2483.95, "total_tokens": 136608} +{"current_steps": 240, "total_steps": 134280, "loss": 1.0926, "lr": 8.899314864462318e-07, "epoch": 0.035746201966041107, "percentage": 0.18, "elapsed_time": "0:00:56", "remaining_time": "8:43:13", "throughput": 2487.77, "total_tokens": 139840} +{"current_steps": 245, "total_steps": 134280, "loss": 1.0264, "lr": 9.085492999702115e-07, "epoch": 0.036490914507000295, "percentage": 0.18, "elapsed_time": "0:00:57", "remaining_time": "8:43:41", "throughput": 2491.07, "total_tokens": 143072} +{"current_steps": 250, "total_steps": 134280, "loss": 0.5904, "lr": 9.271671134941912e-07, "epoch": 0.03723562704795949, "percentage": 0.19, "elapsed_time": "0:00:58", "remaining_time": "8:43:26", "throughput": 2490.9, "total_tokens": 145920} +{"current_steps": 255, "total_steps": 134280, "loss": 0.866, "lr": 9.457849270181709e-07, "epoch": 0.03798033958891868, "percentage": 0.19, "elapsed_time": "0:00:59", "remaining_time": "8:43:56", "throughput": 2492.57, "total_tokens": 149088} +{"current_steps": 260, "total_steps": 134280, "loss": 1.0469, "lr": 9.644027405421507e-07, "epoch": 0.03872505212987787, "percentage": 0.19, "elapsed_time": "0:01:01", "remaining_time": "8:46:00", "throughput": 2494.04, "total_tokens": 152704} +{"current_steps": 265, "total_steps": 134280, "loss": 0.8658, "lr": 9.830205540661306e-07, "epoch": 0.03946976467083706, "percentage": 0.2, "elapsed_time": "0:01:02", "remaining_time": "8:45:31", "throughput": 2494.78, "total_tokens": 155552} +{"current_steps": 270, "total_steps": 134280, "loss": 1.1373, "lr": 1.0016383675901103e-06, "epoch": 0.040214477211796246, "percentage": 0.2, "elapsed_time": "0:01:03", "remaining_time": "8:45:25", "throughput": 2495.34, "total_tokens": 158496} +{"current_steps": 275, "total_steps": 134280, "loss": 1.0503, "lr": 1.02025618111409e-06, "epoch": 0.040959189752755434, "percentage": 0.2, "elapsed_time": "0:01:04", "remaining_time": "8:45:32", "throughput": 2496.34, "total_tokens": 161536} +{"current_steps": 280, "total_steps": 134280, "loss": 0.9215, "lr": 1.0388739946380697e-06, "epoch": 0.04170390229371462, "percentage": 0.21, "elapsed_time": "0:01:05", "remaining_time": "8:45:09", "throughput": 2496.71, "total_tokens": 164384} +{"current_steps": 285, "total_steps": 134280, "loss": 0.9587, "lr": 1.0574918081620494e-06, "epoch": 0.04244861483467382, "percentage": 0.21, "elapsed_time": "0:01:06", "remaining_time": "8:44:49", "throughput": 2496.44, "total_tokens": 167200} +{"current_steps": 290, "total_steps": 134280, "loss": 0.9346, "lr": 1.0761096216860292e-06, "epoch": 0.04319332737563301, "percentage": 0.22, "elapsed_time": "0:01:08", "remaining_time": "8:44:46", "throughput": 2497.63, "total_tokens": 170208} +{"current_steps": 295, "total_steps": 134280, "loss": 0.9133, "lr": 1.0947274352100089e-06, "epoch": 0.043938039916592196, "percentage": 0.22, "elapsed_time": "0:01:09", "remaining_time": "8:45:18", "throughput": 2498.82, "total_tokens": 173408} +{"current_steps": 300, "total_steps": 134280, "loss": 0.793, "lr": 1.1133452487339888e-06, "epoch": 0.044682752457551385, "percentage": 0.22, "elapsed_time": "0:01:10", "remaining_time": "8:44:39", "throughput": 2497.81, "total_tokens": 176064} +{"current_steps": 305, "total_steps": 134280, "loss": 0.7625, "lr": 1.1319630622579685e-06, "epoch": 0.045427464998510574, "percentage": 0.23, "elapsed_time": "0:01:11", "remaining_time": "8:44:13", "throughput": 2497.73, "total_tokens": 178848} +{"current_steps": 310, "total_steps": 134280, "loss": 0.8548, "lr": 1.1505808757819482e-06, "epoch": 0.04617217753946976, "percentage": 0.23, "elapsed_time": "0:01:12", "remaining_time": "8:44:15", "throughput": 2498.52, "total_tokens": 181856} +{"current_steps": 315, "total_steps": 134280, "loss": 0.74, "lr": 1.169198689305928e-06, "epoch": 0.04691689008042895, "percentage": 0.23, "elapsed_time": "0:01:13", "remaining_time": "8:44:18", "throughput": 2499.56, "total_tokens": 184896} +{"current_steps": 320, "total_steps": 134280, "loss": 0.8964, "lr": 1.1878165028299077e-06, "epoch": 0.04766160262138815, "percentage": 0.24, "elapsed_time": "0:01:15", "remaining_time": "8:44:02", "throughput": 2500.46, "total_tokens": 187808} +{"current_steps": 325, "total_steps": 134280, "loss": 0.6091, "lr": 1.2064343163538874e-06, "epoch": 0.048406315162347335, "percentage": 0.24, "elapsed_time": "0:01:16", "remaining_time": "8:44:13", "throughput": 2501.27, "total_tokens": 190880} +{"current_steps": 330, "total_steps": 134280, "loss": 1.0402, "lr": 1.2250521298778673e-06, "epoch": 0.049151027703306524, "percentage": 0.25, "elapsed_time": "0:01:17", "remaining_time": "8:43:33", "throughput": 2500.8, "total_tokens": 193536} +{"current_steps": 335, "total_steps": 134280, "loss": 1.0405, "lr": 1.243669943401847e-06, "epoch": 0.04989574024426571, "percentage": 0.25, "elapsed_time": "0:01:18", "remaining_time": "8:43:27", "throughput": 2500.9, "total_tokens": 196448} +{"current_steps": 340, "total_steps": 134280, "loss": 0.6042, "lr": 1.2622877569258267e-06, "epoch": 0.0506404527852249, "percentage": 0.25, "elapsed_time": "0:01:19", "remaining_time": "8:42:50", "throughput": 2500.67, "total_tokens": 199136} +{"current_steps": 345, "total_steps": 134280, "loss": 0.996, "lr": 1.2809055704498064e-06, "epoch": 0.05138516532618409, "percentage": 0.26, "elapsed_time": "0:01:20", "remaining_time": "8:43:00", "throughput": 2501.96, "total_tokens": 202240} +{"current_steps": 350, "total_steps": 134280, "loss": 0.7972, "lr": 1.2995233839737862e-06, "epoch": 0.052129877867143286, "percentage": 0.26, "elapsed_time": "0:01:21", "remaining_time": "8:42:29", "throughput": 2501.01, "total_tokens": 204896} +{"current_steps": 355, "total_steps": 134280, "loss": 0.8037, "lr": 1.3181411974977659e-06, "epoch": 0.052874590408102475, "percentage": 0.26, "elapsed_time": "0:01:23", "remaining_time": "8:41:52", "throughput": 2500.55, "total_tokens": 207552} +{"current_steps": 360, "total_steps": 134280, "loss": 0.7322, "lr": 1.3367590110217456e-06, "epoch": 0.05361930294906166, "percentage": 0.27, "elapsed_time": "0:01:24", "remaining_time": "8:41:18", "throughput": 2500.38, "total_tokens": 210240} +{"current_steps": 365, "total_steps": 134280, "loss": 0.6653, "lr": 1.3553768245457255e-06, "epoch": 0.05436401549002085, "percentage": 0.27, "elapsed_time": "0:01:25", "remaining_time": "8:41:04", "throughput": 2499.84, "total_tokens": 213024} +{"current_steps": 370, "total_steps": 134280, "loss": 0.6667, "lr": 1.3739946380697052e-06, "epoch": 0.05510872803098004, "percentage": 0.28, "elapsed_time": "0:01:26", "remaining_time": "8:40:48", "throughput": 2499.83, "total_tokens": 215840} +{"current_steps": 375, "total_steps": 134280, "loss": 0.7343, "lr": 1.392612451593685e-06, "epoch": 0.05585344057193923, "percentage": 0.28, "elapsed_time": "0:01:27", "remaining_time": "8:40:17", "throughput": 2499.64, "total_tokens": 218528} +{"current_steps": 380, "total_steps": 134280, "loss": 0.9279, "lr": 1.4112302651176647e-06, "epoch": 0.05659815311289842, "percentage": 0.28, "elapsed_time": "0:01:28", "remaining_time": "8:41:11", "throughput": 2499.5, "total_tokens": 221824} +{"current_steps": 385, "total_steps": 134280, "loss": 0.6518, "lr": 1.4298480786416444e-06, "epoch": 0.057342865653857614, "percentage": 0.29, "elapsed_time": "0:01:29", "remaining_time": "8:40:50", "throughput": 2498.22, "total_tokens": 224480} +{"current_steps": 390, "total_steps": 134280, "loss": 0.6231, "lr": 1.448465892165624e-06, "epoch": 0.0580875781948168, "percentage": 0.29, "elapsed_time": "0:01:30", "remaining_time": "8:40:38", "throughput": 2497.99, "total_tokens": 227296} +{"current_steps": 395, "total_steps": 134280, "loss": 0.8925, "lr": 1.4670837056896038e-06, "epoch": 0.05883229073577599, "percentage": 0.29, "elapsed_time": "0:01:32", "remaining_time": "8:40:05", "throughput": 2497.36, "total_tokens": 229920} +{"current_steps": 400, "total_steps": 134280, "loss": 0.6556, "lr": 1.4857015192135837e-06, "epoch": 0.05957700327673518, "percentage": 0.3, "elapsed_time": "0:01:33", "remaining_time": "8:39:32", "throughput": 2496.5, "total_tokens": 232512} +{"current_steps": 405, "total_steps": 134280, "loss": 0.799, "lr": 1.5043193327375634e-06, "epoch": 0.06032171581769437, "percentage": 0.3, "elapsed_time": "0:01:34", "remaining_time": "8:39:41", "throughput": 2497.41, "total_tokens": 235584} +{"current_steps": 410, "total_steps": 134280, "loss": 0.9613, "lr": 1.5229371462615432e-06, "epoch": 0.06106642835865356, "percentage": 0.31, "elapsed_time": "0:01:35", "remaining_time": "8:39:39", "throughput": 2497.53, "total_tokens": 238496} +{"current_steps": 415, "total_steps": 134280, "loss": 0.7163, "lr": 1.5415549597855229e-06, "epoch": 0.06181114089961275, "percentage": 0.31, "elapsed_time": "0:01:36", "remaining_time": "8:39:36", "throughput": 2497.4, "total_tokens": 241376} +{"current_steps": 420, "total_steps": 134280, "loss": 0.7431, "lr": 1.5601727733095026e-06, "epoch": 0.06255585344057193, "percentage": 0.31, "elapsed_time": "0:01:37", "remaining_time": "8:39:35", "throughput": 2497.72, "total_tokens": 244320} +{"current_steps": 425, "total_steps": 134280, "loss": 0.9822, "lr": 1.5787905868334823e-06, "epoch": 0.06330056598153112, "percentage": 0.32, "elapsed_time": "0:01:39", "remaining_time": "8:40:02", "throughput": 2498.07, "total_tokens": 247488} +{"current_steps": 430, "total_steps": 134280, "loss": 1.0591, "lr": 1.597408400357462e-06, "epoch": 0.06404527852249031, "percentage": 0.32, "elapsed_time": "0:01:40", "remaining_time": "8:39:41", "throughput": 2497.76, "total_tokens": 250208} +{"current_steps": 435, "total_steps": 134280, "loss": 0.803, "lr": 1.6160262138814417e-06, "epoch": 0.06478999106344951, "percentage": 0.32, "elapsed_time": "0:01:41", "remaining_time": "8:39:39", "throughput": 2497.85, "total_tokens": 253120} +{"current_steps": 440, "total_steps": 134280, "loss": 0.6733, "lr": 1.6346440274054214e-06, "epoch": 0.0655347036044087, "percentage": 0.33, "elapsed_time": "0:01:42", "remaining_time": "8:39:37", "throughput": 2497.93, "total_tokens": 256032} +{"current_steps": 445, "total_steps": 134280, "loss": 0.9301, "lr": 1.6532618409294012e-06, "epoch": 0.06627941614536789, "percentage": 0.33, "elapsed_time": "0:01:43", "remaining_time": "8:39:32", "throughput": 2497.99, "total_tokens": 258912} +{"current_steps": 450, "total_steps": 134280, "loss": 0.7574, "lr": 1.6718796544533813e-06, "epoch": 0.06702412868632708, "percentage": 0.34, "elapsed_time": "0:01:44", "remaining_time": "8:39:15", "throughput": 2498.35, "total_tokens": 261728} +{"current_steps": 455, "total_steps": 134280, "loss": 0.6012, "lr": 1.690497467977361e-06, "epoch": 0.06776884122728627, "percentage": 0.34, "elapsed_time": "0:01:45", "remaining_time": "8:39:17", "throughput": 2497.85, "total_tokens": 264608} +{"current_steps": 460, "total_steps": 134280, "loss": 0.7136, "lr": 1.7091152815013407e-06, "epoch": 0.06851355376824546, "percentage": 0.34, "elapsed_time": "0:01:47", "remaining_time": "8:39:41", "throughput": 2497.96, "total_tokens": 267744} +{"current_steps": 465, "total_steps": 134280, "loss": 0.7868, "lr": 1.7277330950253204e-06, "epoch": 0.06925826630920465, "percentage": 0.35, "elapsed_time": "0:01:48", "remaining_time": "8:40:05", "throughput": 2498.3, "total_tokens": 270912} +{"current_steps": 470, "total_steps": 134280, "loss": 0.9032, "lr": 1.7463509085493002e-06, "epoch": 0.07000297885016384, "percentage": 0.35, "elapsed_time": "0:01:49", "remaining_time": "8:40:03", "throughput": 2498.37, "total_tokens": 273824} +{"current_steps": 475, "total_steps": 134280, "loss": 0.7897, "lr": 1.7649687220732799e-06, "epoch": 0.07074769139112302, "percentage": 0.35, "elapsed_time": "0:01:50", "remaining_time": "8:40:15", "throughput": 2499.34, "total_tokens": 276960} +{"current_steps": 480, "total_steps": 134280, "loss": 0.6496, "lr": 1.7835865355972596e-06, "epoch": 0.07149240393208221, "percentage": 0.36, "elapsed_time": "0:01:51", "remaining_time": "8:39:56", "throughput": 2499.27, "total_tokens": 279712} +{"current_steps": 485, "total_steps": 134280, "loss": 0.7436, "lr": 1.8022043491212393e-06, "epoch": 0.0722371164730414, "percentage": 0.36, "elapsed_time": "0:01:53", "remaining_time": "8:39:47", "throughput": 2499.66, "total_tokens": 282592} +{"current_steps": 490, "total_steps": 134280, "loss": 0.9846, "lr": 1.820822162645219e-06, "epoch": 0.07298182901400059, "percentage": 0.36, "elapsed_time": "0:01:54", "remaining_time": "8:39:41", "throughput": 2499.73, "total_tokens": 285472} +{"current_steps": 495, "total_steps": 134280, "loss": 0.6809, "lr": 1.8394399761691987e-06, "epoch": 0.07372654155495978, "percentage": 0.37, "elapsed_time": "0:01:55", "remaining_time": "8:39:49", "throughput": 2500.38, "total_tokens": 288544} +{"current_steps": 500, "total_steps": 134280, "loss": 0.7028, "lr": 1.8580577896931784e-06, "epoch": 0.07447125409591898, "percentage": 0.37, "elapsed_time": "0:01:56", "remaining_time": "8:39:47", "throughput": 2501.21, "total_tokens": 291552} +{"current_steps": 505, "total_steps": 134280, "loss": 0.7074, "lr": 1.8766756032171582e-06, "epoch": 0.07521596663687817, "percentage": 0.38, "elapsed_time": "0:01:57", "remaining_time": "8:39:51", "throughput": 2500.57, "total_tokens": 294432} +{"current_steps": 510, "total_steps": 134280, "loss": 0.7605, "lr": 1.8952934167411379e-06, "epoch": 0.07596067917783736, "percentage": 0.38, "elapsed_time": "0:01:58", "remaining_time": "8:39:42", "throughput": 2501.12, "total_tokens": 297344} +{"current_steps": 515, "total_steps": 134280, "loss": 0.8859, "lr": 1.913911230265118e-06, "epoch": 0.07670539171879655, "percentage": 0.38, "elapsed_time": "0:02:00", "remaining_time": "8:39:49", "throughput": 2501.77, "total_tokens": 300416} +{"current_steps": 520, "total_steps": 134280, "loss": 0.7464, "lr": 1.9325290437890977e-06, "epoch": 0.07745010425975574, "percentage": 0.39, "elapsed_time": "0:02:01", "remaining_time": "8:39:59", "throughput": 2502.44, "total_tokens": 303520} +{"current_steps": 525, "total_steps": 134280, "loss": 0.6822, "lr": 1.9511468573130772e-06, "epoch": 0.07819481680071493, "percentage": 0.39, "elapsed_time": "0:02:02", "remaining_time": "8:39:36", "throughput": 2502.29, "total_tokens": 306208} +{"current_steps": 530, "total_steps": 134280, "loss": 0.8026, "lr": 1.969764670837057e-06, "epoch": 0.07893952934167411, "percentage": 0.39, "elapsed_time": "0:02:03", "remaining_time": "8:40:02", "throughput": 2503.22, "total_tokens": 309504} +{"current_steps": 535, "total_steps": 134280, "loss": 0.7687, "lr": 1.9883824843610367e-06, "epoch": 0.0796842418826333, "percentage": 0.4, "elapsed_time": "0:02:04", "remaining_time": "8:39:52", "throughput": 2503.55, "total_tokens": 312384} +{"current_steps": 540, "total_steps": 134280, "loss": 0.8412, "lr": 2.0070002978850166e-06, "epoch": 0.08042895442359249, "percentage": 0.4, "elapsed_time": "0:02:05", "remaining_time": "8:39:34", "throughput": 2503.1, "total_tokens": 315072} +{"current_steps": 545, "total_steps": 134280, "loss": 0.8303, "lr": 2.025618111408996e-06, "epoch": 0.08117366696455168, "percentage": 0.41, "elapsed_time": "0:02:07", "remaining_time": "8:39:35", "throughput": 2503.62, "total_tokens": 318080} +{"current_steps": 550, "total_steps": 134280, "loss": 0.7719, "lr": 2.044235924932976e-06, "epoch": 0.08191837950551087, "percentage": 0.41, "elapsed_time": "0:02:08", "remaining_time": "8:39:27", "throughput": 2503.92, "total_tokens": 320960} +{"current_steps": 555, "total_steps": 134280, "loss": 0.8099, "lr": 2.0628537384569555e-06, "epoch": 0.08266309204647006, "percentage": 0.41, "elapsed_time": "0:02:09", "remaining_time": "8:39:42", "throughput": 2504.78, "total_tokens": 324160} +{"current_steps": 560, "total_steps": 134280, "loss": 0.749, "lr": 2.0814715519809354e-06, "epoch": 0.08340780458742925, "percentage": 0.42, "elapsed_time": "0:02:10", "remaining_time": "8:39:22", "throughput": 2503.98, "total_tokens": 326784} +{"current_steps": 565, "total_steps": 134280, "loss": 0.6714, "lr": 2.100089365504915e-06, "epoch": 0.08415251712838845, "percentage": 0.42, "elapsed_time": "0:02:11", "remaining_time": "8:39:19", "throughput": 2504.13, "total_tokens": 329696} +{"current_steps": 570, "total_steps": 134280, "loss": 0.7716, "lr": 2.118707179028895e-06, "epoch": 0.08489722966934764, "percentage": 0.42, "elapsed_time": "0:02:13", "remaining_time": "8:40:08", "throughput": 2505.08, "total_tokens": 333280} +{"current_steps": 575, "total_steps": 134280, "loss": 0.8009, "lr": 2.1373249925528744e-06, "epoch": 0.08564194221030683, "percentage": 0.43, "elapsed_time": "0:02:14", "remaining_time": "8:40:02", "throughput": 2505.2, "total_tokens": 336160} +{"current_steps": 580, "total_steps": 134280, "loss": 0.6427, "lr": 2.1559428060768547e-06, "epoch": 0.08638665475126601, "percentage": 0.43, "elapsed_time": "0:02:15", "remaining_time": "8:39:51", "throughput": 2504.49, "total_tokens": 338880} +{"current_steps": 585, "total_steps": 134280, "loss": 0.7976, "lr": 2.1745606196008342e-06, "epoch": 0.0871313672922252, "percentage": 0.44, "elapsed_time": "0:02:16", "remaining_time": "8:39:46", "throughput": 2504.93, "total_tokens": 341824} +{"current_steps": 590, "total_steps": 134280, "loss": 0.696, "lr": 2.193178433124814e-06, "epoch": 0.08787607983318439, "percentage": 0.44, "elapsed_time": "0:02:17", "remaining_time": "8:39:39", "throughput": 2504.88, "total_tokens": 344672} +{"current_steps": 595, "total_steps": 134280, "loss": 0.6415, "lr": 2.2117962466487937e-06, "epoch": 0.08862079237414358, "percentage": 0.44, "elapsed_time": "0:02:18", "remaining_time": "8:39:29", "throughput": 2504.35, "total_tokens": 347424} +{"current_steps": 600, "total_steps": 134280, "loss": 0.7075, "lr": 2.2304140601727736e-06, "epoch": 0.08936550491510277, "percentage": 0.45, "elapsed_time": "0:02:19", "remaining_time": "8:39:20", "throughput": 2504.44, "total_tokens": 350272} +{"current_steps": 605, "total_steps": 134280, "loss": 0.7014, "lr": 2.249031873696753e-06, "epoch": 0.09011021745606196, "percentage": 0.45, "elapsed_time": "0:02:21", "remaining_time": "8:39:18", "throughput": 2504.93, "total_tokens": 353248} +{"current_steps": 610, "total_steps": 134280, "loss": 0.7308, "lr": 2.267649687220733e-06, "epoch": 0.09085492999702115, "percentage": 0.45, "elapsed_time": "0:02:22", "remaining_time": "8:39:11", "throughput": 2504.89, "total_tokens": 356096} +{"current_steps": 615, "total_steps": 134280, "loss": 0.8127, "lr": 2.2862675007447125e-06, "epoch": 0.09159964253798034, "percentage": 0.46, "elapsed_time": "0:02:23", "remaining_time": "8:38:57", "throughput": 2504.32, "total_tokens": 358784} +{"current_steps": 620, "total_steps": 134280, "loss": 0.7339, "lr": 2.3048853142686924e-06, "epoch": 0.09234435507893952, "percentage": 0.46, "elapsed_time": "0:02:24", "remaining_time": "8:38:43", "throughput": 2504.24, "total_tokens": 361536} +{"current_steps": 625, "total_steps": 134280, "loss": 0.81, "lr": 2.323503127792672e-06, "epoch": 0.09308906761989871, "percentage": 0.47, "elapsed_time": "0:02:25", "remaining_time": "8:38:43", "throughput": 2504.54, "total_tokens": 364512} +{"current_steps": 630, "total_steps": 134280, "loss": 0.5694, "lr": 2.342120941316652e-06, "epoch": 0.0938337801608579, "percentage": 0.47, "elapsed_time": "0:02:26", "remaining_time": "8:38:42", "throughput": 2504.54, "total_tokens": 367424} +{"current_steps": 635, "total_steps": 134280, "loss": 0.7141, "lr": 2.3607387548406314e-06, "epoch": 0.0945784927018171, "percentage": 0.47, "elapsed_time": "0:02:27", "remaining_time": "8:38:35", "throughput": 2504.09, "total_tokens": 370208} +{"current_steps": 640, "total_steps": 134280, "loss": 0.8454, "lr": 2.3793565683646113e-06, "epoch": 0.0953232052427763, "percentage": 0.48, "elapsed_time": "0:02:29", "remaining_time": "8:38:37", "throughput": 2504.7, "total_tokens": 373248} +{"current_steps": 645, "total_steps": 134280, "loss": 0.8899, "lr": 2.3979743818885912e-06, "epoch": 0.09606791778373548, "percentage": 0.48, "elapsed_time": "0:02:30", "remaining_time": "8:38:36", "throughput": 2504.85, "total_tokens": 376192} +{"current_steps": 650, "total_steps": 134280, "loss": 0.7172, "lr": 2.416592195412571e-06, "epoch": 0.09681263032469467, "percentage": 0.48, "elapsed_time": "0:02:31", "remaining_time": "8:38:22", "throughput": 2504.54, "total_tokens": 378912} +{"current_steps": 655, "total_steps": 134280, "loss": 0.7742, "lr": 2.4352100089365507e-06, "epoch": 0.09755734286565386, "percentage": 0.49, "elapsed_time": "0:02:32", "remaining_time": "8:38:27", "throughput": 2505.13, "total_tokens": 381984} +{"current_steps": 660, "total_steps": 134280, "loss": 0.9877, "lr": 2.4538278224605306e-06, "epoch": 0.09830205540661305, "percentage": 0.49, "elapsed_time": "0:02:33", "remaining_time": "8:38:23", "throughput": 2504.72, "total_tokens": 384800} +{"current_steps": 665, "total_steps": 134280, "loss": 0.7495, "lr": 2.47244563598451e-06, "epoch": 0.09904676794757224, "percentage": 0.5, "elapsed_time": "0:02:34", "remaining_time": "8:38:18", "throughput": 2504.97, "total_tokens": 387712} +{"current_steps": 670, "total_steps": 134280, "loss": 0.6759, "lr": 2.49106344950849e-06, "epoch": 0.09979148048853143, "percentage": 0.5, "elapsed_time": "0:02:35", "remaining_time": "8:38:20", "throughput": 2504.88, "total_tokens": 390656} +{"current_steps": 675, "total_steps": 134280, "loss": 0.8335, "lr": 2.5096812630324695e-06, "epoch": 0.10053619302949061, "percentage": 0.5, "elapsed_time": "0:02:37", "remaining_time": "8:38:14", "throughput": 2504.84, "total_tokens": 393504} +{"current_steps": 680, "total_steps": 134280, "loss": 0.6444, "lr": 2.5282990765564494e-06, "epoch": 0.1012809055704498, "percentage": 0.51, "elapsed_time": "0:02:38", "remaining_time": "8:38:02", "throughput": 2504.75, "total_tokens": 396256} +{"current_steps": 685, "total_steps": 134280, "loss": 0.6714, "lr": 2.546916890080429e-06, "epoch": 0.10202561811140899, "percentage": 0.51, "elapsed_time": "0:02:39", "remaining_time": "8:38:13", "throughput": 2504.75, "total_tokens": 399328} +{"current_steps": 690, "total_steps": 134280, "loss": 0.7426, "lr": 2.565534703604409e-06, "epoch": 0.10277033065236818, "percentage": 0.51, "elapsed_time": "0:02:40", "remaining_time": "8:38:03", "throughput": 2504.42, "total_tokens": 402080} +{"current_steps": 695, "total_steps": 134280, "loss": 0.7907, "lr": 2.5841525171283884e-06, "epoch": 0.10351504319332737, "percentage": 0.52, "elapsed_time": "0:02:41", "remaining_time": "8:37:56", "throughput": 2504.25, "total_tokens": 404896} +{"current_steps": 700, "total_steps": 134280, "loss": 0.8646, "lr": 2.6027703306523683e-06, "epoch": 0.10425975573428657, "percentage": 0.52, "elapsed_time": "0:02:42", "remaining_time": "8:37:42", "throughput": 2503.76, "total_tokens": 407552} +{"current_steps": 705, "total_steps": 134280, "loss": 0.8856, "lr": 2.621388144176348e-06, "epoch": 0.10500446827524576, "percentage": 0.53, "elapsed_time": "0:02:43", "remaining_time": "8:37:46", "throughput": 2504.08, "total_tokens": 410592} +{"current_steps": 710, "total_steps": 134280, "loss": 0.771, "lr": 2.6400059577003277e-06, "epoch": 0.10574918081620495, "percentage": 0.53, "elapsed_time": "0:02:45", "remaining_time": "8:37:37", "throughput": 2504.0, "total_tokens": 413376} +{"current_steps": 715, "total_steps": 134280, "loss": 0.6754, "lr": 2.6586237712243077e-06, "epoch": 0.10649389335716414, "percentage": 0.53, "elapsed_time": "0:02:46", "remaining_time": "8:37:28", "throughput": 2503.84, "total_tokens": 416160} +{"current_steps": 720, "total_steps": 134280, "loss": 0.7609, "lr": 2.6772415847482876e-06, "epoch": 0.10723860589812333, "percentage": 0.54, "elapsed_time": "0:02:47", "remaining_time": "8:37:33", "throughput": 2503.92, "total_tokens": 419168} +{"current_steps": 725, "total_steps": 134280, "loss": 0.6979, "lr": 2.695859398272267e-06, "epoch": 0.10798331843908252, "percentage": 0.54, "elapsed_time": "0:02:48", "remaining_time": "8:37:30", "throughput": 2504.27, "total_tokens": 422112} +{"current_steps": 730, "total_steps": 134280, "loss": 0.9066, "lr": 2.714477211796247e-06, "epoch": 0.1087280309800417, "percentage": 0.54, "elapsed_time": "0:02:49", "remaining_time": "8:37:23", "throughput": 2504.37, "total_tokens": 424960} +{"current_steps": 735, "total_steps": 134280, "loss": 0.7535, "lr": 2.7330950253202265e-06, "epoch": 0.10947274352100089, "percentage": 0.55, "elapsed_time": "0:02:50", "remaining_time": "8:37:17", "throughput": 2504.73, "total_tokens": 427872} +{"current_steps": 740, "total_steps": 134280, "loss": 0.7038, "lr": 2.7517128388442064e-06, "epoch": 0.11021745606196008, "percentage": 0.55, "elapsed_time": "0:02:52", "remaining_time": "8:37:24", "throughput": 2505.42, "total_tokens": 431008} +{"current_steps": 745, "total_steps": 134280, "loss": 0.7445, "lr": 2.770330652368186e-06, "epoch": 0.11096216860291927, "percentage": 0.55, "elapsed_time": "0:02:53", "remaining_time": "8:37:23", "throughput": 2505.93, "total_tokens": 434016} +{"current_steps": 750, "total_steps": 134280, "loss": 0.6516, "lr": 2.788948465892166e-06, "epoch": 0.11170688114387846, "percentage": 0.56, "elapsed_time": "0:02:54", "remaining_time": "8:37:14", "throughput": 2505.5, "total_tokens": 436736} +{"current_steps": 755, "total_steps": 134280, "loss": 0.7345, "lr": 2.8075662794161454e-06, "epoch": 0.11245159368483765, "percentage": 0.56, "elapsed_time": "0:02:55", "remaining_time": "8:37:18", "throughput": 2505.79, "total_tokens": 439776} +{"current_steps": 760, "total_steps": 134280, "loss": 0.7247, "lr": 2.8261840929401253e-06, "epoch": 0.11319630622579684, "percentage": 0.57, "elapsed_time": "0:02:56", "remaining_time": "8:37:11", "throughput": 2505.75, "total_tokens": 442592} +{"current_steps": 765, "total_steps": 134280, "loss": 0.709, "lr": 2.844801906464105e-06, "epoch": 0.11394101876675604, "percentage": 0.57, "elapsed_time": "0:02:57", "remaining_time": "8:37:11", "throughput": 2505.99, "total_tokens": 445568} +{"current_steps": 770, "total_steps": 134280, "loss": 0.818, "lr": 2.8634197199880847e-06, "epoch": 0.11468573130771523, "percentage": 0.57, "elapsed_time": "0:02:58", "remaining_time": "8:37:10", "throughput": 2505.99, "total_tokens": 448480} +{"current_steps": 775, "total_steps": 134280, "loss": 0.7635, "lr": 2.8820375335120642e-06, "epoch": 0.11543044384867442, "percentage": 0.58, "elapsed_time": "0:03:00", "remaining_time": "8:36:58", "throughput": 2505.65, "total_tokens": 451168} +{"current_steps": 780, "total_steps": 134280, "loss": 0.7071, "lr": 2.9006553470360446e-06, "epoch": 0.1161751563896336, "percentage": 0.58, "elapsed_time": "0:03:01", "remaining_time": "8:37:18", "throughput": 2506.18, "total_tokens": 454496} +{"current_steps": 785, "total_steps": 134280, "loss": 0.7652, "lr": 2.919273160560024e-06, "epoch": 0.1169198689305928, "percentage": 0.58, "elapsed_time": "0:03:02", "remaining_time": "8:37:36", "throughput": 2506.92, "total_tokens": 457824} +{"current_steps": 790, "total_steps": 134280, "loss": 0.7412, "lr": 2.937890974084004e-06, "epoch": 0.11766458147155198, "percentage": 0.59, "elapsed_time": "0:03:03", "remaining_time": "8:37:35", "throughput": 2507.03, "total_tokens": 460768} +{"current_steps": 795, "total_steps": 134280, "loss": 0.7525, "lr": 2.9565087876079835e-06, "epoch": 0.11840929401251117, "percentage": 0.59, "elapsed_time": "0:03:04", "remaining_time": "8:37:31", "throughput": 2507.24, "total_tokens": 463680} +{"current_steps": 800, "total_steps": 134280, "loss": 0.8386, "lr": 2.9751266011319634e-06, "epoch": 0.11915400655347036, "percentage": 0.6, "elapsed_time": "0:03:06", "remaining_time": "8:37:31", "throughput": 2507.33, "total_tokens": 466624} +{"current_steps": 805, "total_steps": 134280, "loss": 0.734, "lr": 2.993744414655943e-06, "epoch": 0.11989871909442955, "percentage": 0.6, "elapsed_time": "0:03:07", "remaining_time": "8:37:28", "throughput": 2507.65, "total_tokens": 469568} +{"current_steps": 810, "total_steps": 134280, "loss": 0.7521, "lr": 3.012362228179923e-06, "epoch": 0.12064343163538874, "percentage": 0.6, "elapsed_time": "0:03:08", "remaining_time": "8:37:17", "throughput": 2507.68, "total_tokens": 472352} +{"current_steps": 815, "total_steps": 134280, "loss": 0.8272, "lr": 3.0309800417039024e-06, "epoch": 0.12138814417634793, "percentage": 0.61, "elapsed_time": "0:03:09", "remaining_time": "8:37:50", "throughput": 2508.11, "total_tokens": 475872} +{"current_steps": 820, "total_steps": 134280, "loss": 0.6034, "lr": 3.0495978552278823e-06, "epoch": 0.12213285671730711, "percentage": 0.61, "elapsed_time": "0:03:10", "remaining_time": "8:37:55", "throughput": 2508.25, "total_tokens": 478912} +{"current_steps": 825, "total_steps": 134280, "loss": 0.7202, "lr": 3.068215668751862e-06, "epoch": 0.1228775692582663, "percentage": 0.61, "elapsed_time": "0:03:12", "remaining_time": "8:37:41", "throughput": 2508.11, "total_tokens": 481600} +{"current_steps": 830, "total_steps": 134280, "loss": 0.7328, "lr": 3.0868334822758417e-06, "epoch": 0.1236222817992255, "percentage": 0.62, "elapsed_time": "0:03:13", "remaining_time": "8:37:41", "throughput": 2508.31, "total_tokens": 484576} +{"current_steps": 835, "total_steps": 134280, "loss": 0.6931, "lr": 3.1054512957998212e-06, "epoch": 0.1243669943401847, "percentage": 0.62, "elapsed_time": "0:03:14", "remaining_time": "8:37:42", "throughput": 2508.22, "total_tokens": 487520} +{"current_steps": 840, "total_steps": 134280, "loss": 0.6983, "lr": 3.124069109323801e-06, "epoch": 0.12511170688114387, "percentage": 0.63, "elapsed_time": "0:03:15", "remaining_time": "8:37:42", "throughput": 2508.43, "total_tokens": 490496} +{"current_steps": 845, "total_steps": 134280, "loss": 0.71, "lr": 3.142686922847781e-06, "epoch": 0.12585641942210307, "percentage": 0.63, "elapsed_time": "0:03:16", "remaining_time": "8:37:38", "throughput": 2508.6, "total_tokens": 493408} +{"current_steps": 850, "total_steps": 134280, "loss": 0.8181, "lr": 3.1613047363717606e-06, "epoch": 0.12660113196306225, "percentage": 0.63, "elapsed_time": "0:03:17", "remaining_time": "8:37:27", "throughput": 2508.23, "total_tokens": 496096} +{"current_steps": 855, "total_steps": 134280, "loss": 0.6536, "lr": 3.1799225498957405e-06, "epoch": 0.12734584450402145, "percentage": 0.64, "elapsed_time": "0:03:18", "remaining_time": "8:37:18", "throughput": 2508.38, "total_tokens": 498912} +{"current_steps": 860, "total_steps": 134280, "loss": 0.7174, "lr": 3.19854036341972e-06, "epoch": 0.12809055704498062, "percentage": 0.64, "elapsed_time": "0:03:20", "remaining_time": "8:37:14", "throughput": 2508.76, "total_tokens": 501856} +{"current_steps": 865, "total_steps": 134280, "loss": 0.7349, "lr": 3.2171581769437e-06, "epoch": 0.12883526958593983, "percentage": 0.64, "elapsed_time": "0:03:21", "remaining_time": "8:37:12", "throughput": 2508.61, "total_tokens": 504736} +{"current_steps": 870, "total_steps": 134280, "loss": 0.7201, "lr": 3.2357759904676794e-06, "epoch": 0.12957998212689903, "percentage": 0.65, "elapsed_time": "0:03:22", "remaining_time": "8:37:02", "throughput": 2508.4, "total_tokens": 507456} +{"current_steps": 875, "total_steps": 134280, "loss": 0.8526, "lr": 3.2543938039916594e-06, "epoch": 0.1303246946678582, "percentage": 0.65, "elapsed_time": "0:03:23", "remaining_time": "8:37:04", "throughput": 2508.41, "total_tokens": 510432} +{"current_steps": 880, "total_steps": 134280, "loss": 0.7576, "lr": 3.2730116175156393e-06, "epoch": 0.1310694072088174, "percentage": 0.66, "elapsed_time": "0:03:24", "remaining_time": "8:36:55", "throughput": 2508.42, "total_tokens": 513216} +{"current_steps": 885, "total_steps": 134280, "loss": 0.7103, "lr": 3.291629431039619e-06, "epoch": 0.13181411974977658, "percentage": 0.66, "elapsed_time": "0:03:25", "remaining_time": "8:36:57", "throughput": 2508.72, "total_tokens": 516256} +{"current_steps": 890, "total_steps": 134280, "loss": 0.7738, "lr": 3.3102472445635987e-06, "epoch": 0.13255883229073578, "percentage": 0.66, "elapsed_time": "0:03:26", "remaining_time": "8:36:58", "throughput": 2509.14, "total_tokens": 519296} +{"current_steps": 895, "total_steps": 134280, "loss": 0.6948, "lr": 3.3288650580875782e-06, "epoch": 0.13330354483169496, "percentage": 0.67, "elapsed_time": "0:03:28", "remaining_time": "8:36:54", "throughput": 2508.89, "total_tokens": 522112} +{"current_steps": 900, "total_steps": 134280, "loss": 0.7708, "lr": 3.347482871611558e-06, "epoch": 0.13404825737265416, "percentage": 0.67, "elapsed_time": "0:03:29", "remaining_time": "8:37:05", "throughput": 2509.57, "total_tokens": 525376} +{"current_steps": 905, "total_steps": 134280, "loss": 0.713, "lr": 3.3661006851355377e-06, "epoch": 0.13479296991361334, "percentage": 0.67, "elapsed_time": "0:03:30", "remaining_time": "8:36:56", "throughput": 2509.69, "total_tokens": 528192} +{"current_steps": 910, "total_steps": 134280, "loss": 0.8305, "lr": 3.3847184986595176e-06, "epoch": 0.13553768245457254, "percentage": 0.68, "elapsed_time": "0:03:31", "remaining_time": "8:36:59", "throughput": 2509.49, "total_tokens": 531136} +{"current_steps": 915, "total_steps": 134280, "loss": 0.8253, "lr": 3.403336312183497e-06, "epoch": 0.1362823949955317, "percentage": 0.68, "elapsed_time": "0:03:32", "remaining_time": "8:36:56", "throughput": 2510.06, "total_tokens": 534144} +{"current_steps": 920, "total_steps": 134280, "loss": 0.7497, "lr": 3.421954125707477e-06, "epoch": 0.13702710753649092, "percentage": 0.69, "elapsed_time": "0:03:33", "remaining_time": "8:36:46", "throughput": 2509.75, "total_tokens": 536832} +{"current_steps": 925, "total_steps": 134280, "loss": 0.7402, "lr": 3.4405719392314565e-06, "epoch": 0.1377718200774501, "percentage": 0.69, "elapsed_time": "0:03:34", "remaining_time": "8:36:27", "throughput": 2509.17, "total_tokens": 539328} +{"current_steps": 930, "total_steps": 134280, "loss": 0.7204, "lr": 3.4591897527554364e-06, "epoch": 0.1385165326184093, "percentage": 0.69, "elapsed_time": "0:03:36", "remaining_time": "8:36:23", "throughput": 2509.24, "total_tokens": 542208} +{"current_steps": 935, "total_steps": 134280, "loss": 0.5514, "lr": 3.477807566279416e-06, "epoch": 0.1392612451593685, "percentage": 0.7, "elapsed_time": "0:03:37", "remaining_time": "8:36:19", "throughput": 2509.3, "total_tokens": 545088} +{"current_steps": 940, "total_steps": 134280, "loss": 0.7182, "lr": 3.496425379803396e-06, "epoch": 0.14000595770032767, "percentage": 0.7, "elapsed_time": "0:03:38", "remaining_time": "8:36:10", "throughput": 2508.91, "total_tokens": 547776} +{"current_steps": 945, "total_steps": 134280, "loss": 0.7178, "lr": 3.5150431933273762e-06, "epoch": 0.14075067024128687, "percentage": 0.7, "elapsed_time": "0:03:39", "remaining_time": "8:35:57", "throughput": 2508.57, "total_tokens": 550400} +{"current_steps": 950, "total_steps": 134280, "loss": 0.7161, "lr": 3.5336610068513553e-06, "epoch": 0.14149538278224605, "percentage": 0.71, "elapsed_time": "0:03:40", "remaining_time": "8:35:51", "throughput": 2508.41, "total_tokens": 553184} +{"current_steps": 955, "total_steps": 134280, "loss": 0.7852, "lr": 3.5522788203753356e-06, "epoch": 0.14224009532320525, "percentage": 0.71, "elapsed_time": "0:03:41", "remaining_time": "8:35:47", "throughput": 2508.58, "total_tokens": 556096} +{"current_steps": 960, "total_steps": 134280, "loss": 0.7308, "lr": 3.570896633899315e-06, "epoch": 0.14298480786416443, "percentage": 0.71, "elapsed_time": "0:03:42", "remaining_time": "8:35:37", "throughput": 2508.3, "total_tokens": 558784} +{"current_steps": 965, "total_steps": 134280, "loss": 0.8799, "lr": 3.589514447423295e-06, "epoch": 0.14372952040512363, "percentage": 0.72, "elapsed_time": "0:03:43", "remaining_time": "8:35:36", "throughput": 2508.59, "total_tokens": 561760} +{"current_steps": 970, "total_steps": 134280, "loss": 0.7196, "lr": 3.6081322609472746e-06, "epoch": 0.1444742329460828, "percentage": 0.72, "elapsed_time": "0:03:45", "remaining_time": "8:35:29", "throughput": 2508.52, "total_tokens": 564544} +{"current_steps": 975, "total_steps": 134280, "loss": 0.6004, "lr": 3.6267500744712545e-06, "epoch": 0.145218945487042, "percentage": 0.73, "elapsed_time": "0:03:46", "remaining_time": "8:35:19", "throughput": 2508.14, "total_tokens": 567200} +{"current_steps": 980, "total_steps": 134280, "loss": 0.6157, "lr": 3.645367887995234e-06, "epoch": 0.14596365802800118, "percentage": 0.73, "elapsed_time": "0:03:47", "remaining_time": "8:35:20", "throughput": 2508.54, "total_tokens": 570240} +{"current_steps": 985, "total_steps": 134280, "loss": 0.7004, "lr": 3.663985701519214e-06, "epoch": 0.14670837056896038, "percentage": 0.73, "elapsed_time": "0:03:48", "remaining_time": "8:35:07", "throughput": 2508.32, "total_tokens": 572896} +{"current_steps": 990, "total_steps": 134280, "loss": 0.7115, "lr": 3.6826035150431934e-06, "epoch": 0.14745308310991956, "percentage": 0.74, "elapsed_time": "0:03:49", "remaining_time": "8:35:06", "throughput": 2508.12, "total_tokens": 575744} +{"current_steps": 995, "total_steps": 134280, "loss": 0.6919, "lr": 3.7012213285671734e-06, "epoch": 0.14819779565087876, "percentage": 0.74, "elapsed_time": "0:03:50", "remaining_time": "8:35:13", "throughput": 2508.27, "total_tokens": 578848} +{"current_steps": 1000, "total_steps": 134280, "loss": 0.8411, "lr": 3.719839142091153e-06, "epoch": 0.14894250819183796, "percentage": 0.74, "elapsed_time": "0:03:51", "remaining_time": "8:35:01", "throughput": 2508.07, "total_tokens": 581504} +{"current_steps": 1005, "total_steps": 134280, "loss": 0.7478, "lr": 3.738456955615133e-06, "epoch": 0.14968722073279714, "percentage": 0.75, "elapsed_time": "0:03:52", "remaining_time": "8:34:55", "throughput": 2507.82, "total_tokens": 584256} +{"current_steps": 1010, "total_steps": 134280, "loss": 0.8086, "lr": 3.7570747691391127e-06, "epoch": 0.15043193327375634, "percentage": 0.75, "elapsed_time": "0:03:54", "remaining_time": "8:34:43", "throughput": 2507.61, "total_tokens": 586912} +{"current_steps": 1015, "total_steps": 134280, "loss": 0.6916, "lr": 3.7756925826630922e-06, "epoch": 0.15117664581471552, "percentage": 0.76, "elapsed_time": "0:03:55", "remaining_time": "8:34:47", "throughput": 2507.63, "total_tokens": 589920} +{"current_steps": 1020, "total_steps": 134280, "loss": 0.7222, "lr": 3.794310396187072e-06, "epoch": 0.15192135835567472, "percentage": 0.76, "elapsed_time": "0:03:56", "remaining_time": "8:34:50", "throughput": 2507.95, "total_tokens": 592992} +{"current_steps": 1025, "total_steps": 134280, "loss": 0.6661, "lr": 3.8129282097110517e-06, "epoch": 0.1526660708966339, "percentage": 0.76, "elapsed_time": "0:03:57", "remaining_time": "8:34:46", "throughput": 2508.09, "total_tokens": 595872} +{"current_steps": 1030, "total_steps": 134280, "loss": 0.7223, "lr": 3.831546023235032e-06, "epoch": 0.1534107834375931, "percentage": 0.77, "elapsed_time": "0:03:58", "remaining_time": "8:34:51", "throughput": 2508.58, "total_tokens": 599008} +{"current_steps": 1035, "total_steps": 134280, "loss": 0.7227, "lr": 3.850163836759011e-06, "epoch": 0.15415549597855227, "percentage": 0.77, "elapsed_time": "0:03:59", "remaining_time": "8:34:43", "throughput": 2508.58, "total_tokens": 601792} +{"current_steps": 1040, "total_steps": 134280, "loss": 0.6208, "lr": 3.8687816502829914e-06, "epoch": 0.15490020851951147, "percentage": 0.77, "elapsed_time": "0:04:01", "remaining_time": "8:34:38", "throughput": 2508.52, "total_tokens": 604608} +{"current_steps": 1045, "total_steps": 134280, "loss": 0.7997, "lr": 3.8873994638069705e-06, "epoch": 0.15564492106047065, "percentage": 0.78, "elapsed_time": "0:04:02", "remaining_time": "8:34:23", "throughput": 2508.21, "total_tokens": 607168} +{"current_steps": 1050, "total_steps": 134280, "loss": 0.7294, "lr": 3.9060172773309504e-06, "epoch": 0.15638963360142985, "percentage": 0.78, "elapsed_time": "0:04:03", "remaining_time": "8:34:19", "throughput": 2508.35, "total_tokens": 610048} +{"current_steps": 1055, "total_steps": 134280, "loss": 0.6709, "lr": 3.92463509085493e-06, "epoch": 0.15713434614238903, "percentage": 0.79, "elapsed_time": "0:04:04", "remaining_time": "8:34:14", "throughput": 2508.31, "total_tokens": 612864} +{"current_steps": 1060, "total_steps": 134280, "loss": 0.7238, "lr": 3.94325290437891e-06, "epoch": 0.15787905868334823, "percentage": 0.79, "elapsed_time": "0:04:05", "remaining_time": "8:34:26", "throughput": 2508.57, "total_tokens": 616096} +{"current_steps": 1065, "total_steps": 134280, "loss": 0.7193, "lr": 3.961870717902889e-06, "epoch": 0.15862377122430743, "percentage": 0.79, "elapsed_time": "0:04:06", "remaining_time": "8:34:17", "throughput": 2508.31, "total_tokens": 618784} +{"current_steps": 1070, "total_steps": 134280, "loss": 0.7104, "lr": 3.980488531426869e-06, "epoch": 0.1593684837652666, "percentage": 0.8, "elapsed_time": "0:04:07", "remaining_time": "8:34:13", "throughput": 2508.17, "total_tokens": 621600} +{"current_steps": 1075, "total_steps": 134280, "loss": 0.7398, "lr": 3.999106344950849e-06, "epoch": 0.1601131963062258, "percentage": 0.8, "elapsed_time": "0:04:09", "remaining_time": "8:34:19", "throughput": 2508.43, "total_tokens": 624704} +{"current_steps": 1080, "total_steps": 134280, "loss": 0.8088, "lr": 4.017724158474829e-06, "epoch": 0.16085790884718498, "percentage": 0.8, "elapsed_time": "0:04:10", "remaining_time": "8:34:26", "throughput": 2508.51, "total_tokens": 627808} +{"current_steps": 1085, "total_steps": 134280, "loss": 0.8075, "lr": 4.036341971998809e-06, "epoch": 0.16160262138814419, "percentage": 0.81, "elapsed_time": "0:04:11", "remaining_time": "8:34:25", "throughput": 2508.43, "total_tokens": 630688} +{"current_steps": 1090, "total_steps": 134280, "loss": 0.7266, "lr": 4.054959785522788e-06, "epoch": 0.16234733392910336, "percentage": 0.81, "elapsed_time": "0:04:12", "remaining_time": "8:34:23", "throughput": 2508.52, "total_tokens": 633600} +{"current_steps": 1095, "total_steps": 134280, "loss": 0.7559, "lr": 4.073577599046768e-06, "epoch": 0.16309204647006256, "percentage": 0.82, "elapsed_time": "0:04:13", "remaining_time": "8:34:30", "throughput": 2508.46, "total_tokens": 636672} +{"current_steps": 1100, "total_steps": 134280, "loss": 0.7626, "lr": 4.092195412570748e-06, "epoch": 0.16383675901102174, "percentage": 0.82, "elapsed_time": "0:04:14", "remaining_time": "8:34:17", "throughput": 2507.81, "total_tokens": 639168} +{"current_steps": 1105, "total_steps": 134280, "loss": 0.7512, "lr": 4.110813226094728e-06, "epoch": 0.16458147155198094, "percentage": 0.82, "elapsed_time": "0:04:16", "remaining_time": "8:34:14", "throughput": 2507.63, "total_tokens": 641984} +{"current_steps": 1110, "total_steps": 134280, "loss": 0.7192, "lr": 4.129431039618707e-06, "epoch": 0.16532618409294011, "percentage": 0.83, "elapsed_time": "0:04:17", "remaining_time": "8:34:31", "throughput": 2508.22, "total_tokens": 645408} +{"current_steps": 1115, "total_steps": 134280, "loss": 0.8555, "lr": 4.148048853142687e-06, "epoch": 0.16607089663389932, "percentage": 0.83, "elapsed_time": "0:04:18", "remaining_time": "8:34:21", "throughput": 2507.79, "total_tokens": 648032} +{"current_steps": 1120, "total_steps": 134280, "loss": 0.7054, "lr": 4.166666666666667e-06, "epoch": 0.1668156091748585, "percentage": 0.83, "elapsed_time": "0:04:19", "remaining_time": "8:34:32", "throughput": 2507.98, "total_tokens": 651232} +{"current_steps": 1125, "total_steps": 134280, "loss": 0.6966, "lr": 4.185284480190647e-06, "epoch": 0.1675603217158177, "percentage": 0.84, "elapsed_time": "0:04:20", "remaining_time": "8:34:28", "throughput": 2508.1, "total_tokens": 654112} +{"current_steps": 1130, "total_steps": 134280, "loss": 0.6729, "lr": 4.203902293714626e-06, "epoch": 0.1683050342567769, "percentage": 0.84, "elapsed_time": "0:04:22", "remaining_time": "8:34:34", "throughput": 2508.15, "total_tokens": 657184} +{"current_steps": 1135, "total_steps": 134280, "loss": 0.7181, "lr": 4.222520107238606e-06, "epoch": 0.16904974679773607, "percentage": 0.85, "elapsed_time": "0:04:23", "remaining_time": "8:34:28", "throughput": 2507.93, "total_tokens": 659936} +{"current_steps": 1140, "total_steps": 134280, "loss": 0.6583, "lr": 4.241137920762586e-06, "epoch": 0.16979445933869527, "percentage": 0.85, "elapsed_time": "0:04:24", "remaining_time": "8:34:28", "throughput": 2508.0, "total_tokens": 662880} +{"current_steps": 1145, "total_steps": 134280, "loss": 0.792, "lr": 4.259755734286566e-06, "epoch": 0.17053917187965445, "percentage": 0.85, "elapsed_time": "0:04:25", "remaining_time": "8:34:24", "throughput": 2508.13, "total_tokens": 665760} +{"current_steps": 1150, "total_steps": 134280, "loss": 0.8351, "lr": 4.278373547810546e-06, "epoch": 0.17128388442061365, "percentage": 0.86, "elapsed_time": "0:04:26", "remaining_time": "8:34:24", "throughput": 2507.99, "total_tokens": 668672} +{"current_steps": 1155, "total_steps": 134280, "loss": 0.7889, "lr": 4.296991361334525e-06, "epoch": 0.17202859696157283, "percentage": 0.86, "elapsed_time": "0:04:27", "remaining_time": "8:34:17", "throughput": 2507.92, "total_tokens": 671424} +{"current_steps": 1160, "total_steps": 134280, "loss": 0.8382, "lr": 4.3156091748585054e-06, "epoch": 0.17277330950253203, "percentage": 0.86, "elapsed_time": "0:04:28", "remaining_time": "8:34:12", "throughput": 2507.62, "total_tokens": 674176} +{"current_steps": 1165, "total_steps": 134280, "loss": 0.7197, "lr": 4.3342269883824845e-06, "epoch": 0.1735180220434912, "percentage": 0.87, "elapsed_time": "0:04:29", "remaining_time": "8:34:06", "throughput": 2507.73, "total_tokens": 676992} +{"current_steps": 1170, "total_steps": 134280, "loss": 0.674, "lr": 4.3528448019064644e-06, "epoch": 0.1742627345844504, "percentage": 0.87, "elapsed_time": "0:04:31", "remaining_time": "8:34:05", "throughput": 2507.86, "total_tokens": 679936} +{"current_steps": 1175, "total_steps": 134280, "loss": 0.612, "lr": 4.3714626154304435e-06, "epoch": 0.17500744712540958, "percentage": 0.88, "elapsed_time": "0:04:32", "remaining_time": "8:33:59", "throughput": 2507.57, "total_tokens": 682656} +{"current_steps": 1180, "total_steps": 134280, "loss": 0.7526, "lr": 4.390080428954424e-06, "epoch": 0.17575215966636878, "percentage": 0.88, "elapsed_time": "0:04:33", "remaining_time": "8:33:51", "throughput": 2507.43, "total_tokens": 685376} +{"current_steps": 1185, "total_steps": 134280, "loss": 0.7914, "lr": 4.408698242478403e-06, "epoch": 0.17649687220732796, "percentage": 0.88, "elapsed_time": "0:04:34", "remaining_time": "8:33:41", "throughput": 2507.18, "total_tokens": 688000} +{"current_steps": 1190, "total_steps": 134280, "loss": 0.6554, "lr": 4.427316056002383e-06, "epoch": 0.17724158474828716, "percentage": 0.89, "elapsed_time": "0:04:35", "remaining_time": "8:33:32", "throughput": 2507.26, "total_tokens": 690752} +{"current_steps": 1195, "total_steps": 134280, "loss": 0.6561, "lr": 4.445933869526362e-06, "epoch": 0.17798629728924636, "percentage": 0.89, "elapsed_time": "0:04:36", "remaining_time": "8:33:30", "throughput": 2507.42, "total_tokens": 693696} +{"current_steps": 1200, "total_steps": 134280, "loss": 0.8017, "lr": 4.464551683050343e-06, "epoch": 0.17873100983020554, "percentage": 0.89, "elapsed_time": "0:04:37", "remaining_time": "8:33:35", "throughput": 2507.77, "total_tokens": 696832} +{"current_steps": 1205, "total_steps": 134280, "loss": 0.8048, "lr": 4.483169496574322e-06, "epoch": 0.17947572237116474, "percentage": 0.9, "elapsed_time": "0:04:39", "remaining_time": "8:33:49", "throughput": 2508.21, "total_tokens": 700192} +{"current_steps": 1210, "total_steps": 134280, "loss": 0.7145, "lr": 4.501787310098302e-06, "epoch": 0.18022043491212392, "percentage": 0.9, "elapsed_time": "0:04:40", "remaining_time": "8:33:44", "throughput": 2508.09, "total_tokens": 702976} +{"current_steps": 1215, "total_steps": 134280, "loss": 0.6268, "lr": 4.520405123622282e-06, "epoch": 0.18096514745308312, "percentage": 0.9, "elapsed_time": "0:04:41", "remaining_time": "8:33:36", "throughput": 2507.95, "total_tokens": 705696} +{"current_steps": 1220, "total_steps": 134280, "loss": 0.6908, "lr": 4.539022937146262e-06, "epoch": 0.1817098599940423, "percentage": 0.91, "elapsed_time": "0:04:42", "remaining_time": "8:33:32", "throughput": 2507.99, "total_tokens": 708544} +{"current_steps": 1225, "total_steps": 134280, "loss": 0.7162, "lr": 4.557640750670242e-06, "epoch": 0.1824545725350015, "percentage": 0.91, "elapsed_time": "0:04:43", "remaining_time": "8:33:23", "throughput": 2507.61, "total_tokens": 711168} +{"current_steps": 1230, "total_steps": 134280, "loss": 0.7855, "lr": 4.576258564194221e-06, "epoch": 0.18319928507596067, "percentage": 0.92, "elapsed_time": "0:04:44", "remaining_time": "8:33:26", "throughput": 2507.71, "total_tokens": 714176} +{"current_steps": 1235, "total_steps": 134280, "loss": 0.6927, "lr": 4.594876377718201e-06, "epoch": 0.18394399761691987, "percentage": 0.92, "elapsed_time": "0:04:45", "remaining_time": "8:33:16", "throughput": 2507.46, "total_tokens": 716800} +{"current_steps": 1240, "total_steps": 134280, "loss": 0.6863, "lr": 4.613494191242181e-06, "epoch": 0.18468871015787905, "percentage": 0.92, "elapsed_time": "0:04:47", "remaining_time": "8:33:13", "throughput": 2507.59, "total_tokens": 719712} +{"current_steps": 1245, "total_steps": 134280, "loss": 0.6874, "lr": 4.632112004766161e-06, "epoch": 0.18543342269883825, "percentage": 0.93, "elapsed_time": "0:04:48", "remaining_time": "8:33:16", "throughput": 2507.61, "total_tokens": 722720} +{"current_steps": 1250, "total_steps": 134280, "loss": 0.8331, "lr": 4.65072981829014e-06, "epoch": 0.18617813523979743, "percentage": 0.93, "elapsed_time": "0:04:49", "remaining_time": "8:33:05", "throughput": 2507.14, "total_tokens": 725248} +{"current_steps": 1255, "total_steps": 134280, "loss": 0.6915, "lr": 4.66934763181412e-06, "epoch": 0.18692284778075663, "percentage": 0.93, "elapsed_time": "0:04:50", "remaining_time": "8:33:02", "throughput": 2507.33, "total_tokens": 728160} +{"current_steps": 1260, "total_steps": 134280, "loss": 0.7238, "lr": 4.6879654453381e-06, "epoch": 0.1876675603217158, "percentage": 0.94, "elapsed_time": "0:04:51", "remaining_time": "8:32:58", "throughput": 2507.38, "total_tokens": 731008} +{"current_steps": 1265, "total_steps": 134280, "loss": 0.6573, "lr": 4.70658325886208e-06, "epoch": 0.188412272862675, "percentage": 0.94, "elapsed_time": "0:04:52", "remaining_time": "8:32:55", "throughput": 2507.27, "total_tokens": 733824} +{"current_steps": 1270, "total_steps": 134280, "loss": 0.6318, "lr": 4.725201072386059e-06, "epoch": 0.1891569854036342, "percentage": 0.95, "elapsed_time": "0:04:53", "remaining_time": "8:32:50", "throughput": 2507.25, "total_tokens": 736640} +{"current_steps": 1275, "total_steps": 134280, "loss": 0.6707, "lr": 4.743818885910039e-06, "epoch": 0.18990169794459338, "percentage": 0.95, "elapsed_time": "0:04:54", "remaining_time": "8:32:47", "throughput": 2507.22, "total_tokens": 739488} +{"current_steps": 1280, "total_steps": 134280, "loss": 0.7405, "lr": 4.7624366994340194e-06, "epoch": 0.1906464104855526, "percentage": 0.95, "elapsed_time": "0:04:56", "remaining_time": "8:32:40", "throughput": 2507.0, "total_tokens": 742176} +{"current_steps": 1285, "total_steps": 134280, "loss": 0.5949, "lr": 4.7810545129579985e-06, "epoch": 0.19139112302651176, "percentage": 0.96, "elapsed_time": "0:04:57", "remaining_time": "8:32:41", "throughput": 2507.22, "total_tokens": 745184} +{"current_steps": 1290, "total_steps": 134280, "loss": 0.6681, "lr": 4.7996723264819784e-06, "epoch": 0.19213583556747096, "percentage": 0.96, "elapsed_time": "0:04:58", "remaining_time": "8:32:44", "throughput": 2507.32, "total_tokens": 748224} +{"current_steps": 1295, "total_steps": 134280, "loss": 0.7054, "lr": 4.8182901400059575e-06, "epoch": 0.19288054810843014, "percentage": 0.96, "elapsed_time": "0:04:59", "remaining_time": "8:32:38", "throughput": 2507.12, "total_tokens": 750944} +{"current_steps": 1300, "total_steps": 134280, "loss": 0.6661, "lr": 4.836907953529938e-06, "epoch": 0.19362526064938934, "percentage": 0.97, "elapsed_time": "0:05:00", "remaining_time": "8:32:36", "throughput": 2507.3, "total_tokens": 753888} +{"current_steps": 1305, "total_steps": 134280, "loss": 0.7805, "lr": 4.855525767053917e-06, "epoch": 0.19436997319034852, "percentage": 0.97, "elapsed_time": "0:05:01", "remaining_time": "8:32:32", "throughput": 2507.27, "total_tokens": 756704} +{"current_steps": 1310, "total_steps": 134280, "loss": 0.6147, "lr": 4.874143580577897e-06, "epoch": 0.19511468573130772, "percentage": 0.98, "elapsed_time": "0:05:03", "remaining_time": "8:32:39", "throughput": 2507.61, "total_tokens": 759904} +{"current_steps": 1315, "total_steps": 134280, "loss": 0.6913, "lr": 4.892761394101876e-06, "epoch": 0.1958593982722669, "percentage": 0.98, "elapsed_time": "0:05:04", "remaining_time": "8:32:37", "throughput": 2507.87, "total_tokens": 762848} +{"current_steps": 1320, "total_steps": 134280, "loss": 0.6274, "lr": 4.911379207625857e-06, "epoch": 0.1966041108132261, "percentage": 0.98, "elapsed_time": "0:05:05", "remaining_time": "8:32:30", "throughput": 2507.6, "total_tokens": 765536} +{"current_steps": 1325, "total_steps": 134280, "loss": 0.6771, "lr": 4.929997021149836e-06, "epoch": 0.19734882335418527, "percentage": 0.99, "elapsed_time": "0:05:06", "remaining_time": "8:32:26", "throughput": 2507.64, "total_tokens": 768384} +{"current_steps": 1330, "total_steps": 134280, "loss": 0.5998, "lr": 4.948614834673816e-06, "epoch": 0.19809353589514447, "percentage": 0.99, "elapsed_time": "0:05:07", "remaining_time": "8:32:31", "throughput": 2508.03, "total_tokens": 771552} +{"current_steps": 1335, "total_steps": 134280, "loss": 0.7178, "lr": 4.967232648197795e-06, "epoch": 0.19883824843610368, "percentage": 0.99, "elapsed_time": "0:05:08", "remaining_time": "8:32:28", "throughput": 2507.85, "total_tokens": 774336} +{"current_steps": 1340, "total_steps": 134280, "loss": 0.7107, "lr": 4.985850461721776e-06, "epoch": 0.19958296097706285, "percentage": 1.0, "elapsed_time": "0:05:09", "remaining_time": "8:32:27", "throughput": 2508.06, "total_tokens": 777312} +{"current_steps": 1345, "total_steps": 134280, "loss": 0.9109, "lr": 5.004468275245756e-06, "epoch": 0.20032767351802205, "percentage": 1.0, "elapsed_time": "0:05:11", "remaining_time": "8:32:19", "throughput": 2508.03, "total_tokens": 780032} +{"current_steps": 1350, "total_steps": 134280, "loss": 0.5458, "lr": 5.023086088769735e-06, "epoch": 0.20107238605898123, "percentage": 1.01, "elapsed_time": "0:05:12", "remaining_time": "8:32:12", "throughput": 2507.81, "total_tokens": 782720} +{"current_steps": 1355, "total_steps": 134280, "loss": 0.7233, "lr": 5.041703902293715e-06, "epoch": 0.20181709859994043, "percentage": 1.01, "elapsed_time": "0:05:13", "remaining_time": "8:32:13", "throughput": 2508.09, "total_tokens": 785760} +{"current_steps": 1360, "total_steps": 134280, "loss": 0.6715, "lr": 5.060321715817695e-06, "epoch": 0.2025618111408996, "percentage": 1.01, "elapsed_time": "0:05:14", "remaining_time": "8:32:11", "throughput": 2508.0, "total_tokens": 788608} +{"current_steps": 1365, "total_steps": 134280, "loss": 0.7934, "lr": 5.078939529341675e-06, "epoch": 0.2033065236818588, "percentage": 1.02, "elapsed_time": "0:05:15", "remaining_time": "8:32:21", "throughput": 2508.27, "total_tokens": 791872} +{"current_steps": 1370, "total_steps": 134280, "loss": 0.6949, "lr": 5.097557342865654e-06, "epoch": 0.20405123622281798, "percentage": 1.02, "elapsed_time": "0:05:16", "remaining_time": "8:32:30", "throughput": 2508.55, "total_tokens": 795136} +{"current_steps": 1375, "total_steps": 134280, "loss": 0.7604, "lr": 5.116175156389634e-06, "epoch": 0.20479594876377719, "percentage": 1.02, "elapsed_time": "0:05:18", "remaining_time": "8:32:27", "throughput": 2508.73, "total_tokens": 798048} +{"current_steps": 1380, "total_steps": 134280, "loss": 0.6331, "lr": 5.134792969913614e-06, "epoch": 0.20554066130473636, "percentage": 1.03, "elapsed_time": "0:05:19", "remaining_time": "8:32:17", "throughput": 2508.3, "total_tokens": 800576} +{"current_steps": 1385, "total_steps": 134280, "loss": 0.7416, "lr": 5.153410783437594e-06, "epoch": 0.20628537384569556, "percentage": 1.03, "elapsed_time": "0:05:20", "remaining_time": "8:32:20", "throughput": 2508.39, "total_tokens": 803616} +{"current_steps": 1390, "total_steps": 134280, "loss": 0.9036, "lr": 5.172028596961573e-06, "epoch": 0.20703008638665474, "percentage": 1.04, "elapsed_time": "0:05:21", "remaining_time": "8:32:14", "throughput": 2508.13, "total_tokens": 806304} +{"current_steps": 1395, "total_steps": 134280, "loss": 0.8134, "lr": 5.190646410485553e-06, "epoch": 0.20777479892761394, "percentage": 1.04, "elapsed_time": "0:05:22", "remaining_time": "8:32:09", "throughput": 2507.75, "total_tokens": 808992} +{"current_steps": 1400, "total_steps": 134280, "loss": 0.67, "lr": 5.209264224009533e-06, "epoch": 0.20851951146857314, "percentage": 1.04, "elapsed_time": "0:05:23", "remaining_time": "8:32:09", "throughput": 2507.75, "total_tokens": 811904} +{"current_steps": 1405, "total_steps": 134280, "loss": 0.7022, "lr": 5.2278820375335125e-06, "epoch": 0.20926422400953232, "percentage": 1.05, "elapsed_time": "0:05:24", "remaining_time": "8:32:13", "throughput": 2508.11, "total_tokens": 815072} +{"current_steps": 1410, "total_steps": 134280, "loss": 0.8943, "lr": 5.2464998510574924e-06, "epoch": 0.21000893655049152, "percentage": 1.05, "elapsed_time": "0:05:26", "remaining_time": "8:32:13", "throughput": 2508.17, "total_tokens": 818016} +{"current_steps": 1415, "total_steps": 134280, "loss": 0.6466, "lr": 5.2651176645814715e-06, "epoch": 0.2107536490914507, "percentage": 1.05, "elapsed_time": "0:05:27", "remaining_time": "8:32:13", "throughput": 2508.04, "total_tokens": 820896} +{"current_steps": 1420, "total_steps": 134280, "loss": 0.6707, "lr": 5.2837354781054514e-06, "epoch": 0.2114983616324099, "percentage": 1.06, "elapsed_time": "0:05:28", "remaining_time": "8:32:02", "throughput": 2507.94, "total_tokens": 823520} +{"current_steps": 1425, "total_steps": 134280, "loss": 0.7403, "lr": 5.302353291629431e-06, "epoch": 0.21224307417336907, "percentage": 1.06, "elapsed_time": "0:05:29", "remaining_time": "8:31:52", "throughput": 2507.84, "total_tokens": 826144} +{"current_steps": 1430, "total_steps": 134280, "loss": 0.6748, "lr": 5.320971105153411e-06, "epoch": 0.21298778671432828, "percentage": 1.06, "elapsed_time": "0:05:30", "remaining_time": "8:31:43", "throughput": 2507.63, "total_tokens": 828768} +{"current_steps": 1435, "total_steps": 134280, "loss": 0.761, "lr": 5.33958891867739e-06, "epoch": 0.21373249925528745, "percentage": 1.07, "elapsed_time": "0:05:31", "remaining_time": "8:31:48", "throughput": 2507.98, "total_tokens": 831936} +{"current_steps": 1440, "total_steps": 134280, "loss": 0.6772, "lr": 5.35820673220137e-06, "epoch": 0.21447721179624665, "percentage": 1.07, "elapsed_time": "0:05:32", "remaining_time": "8:31:49", "throughput": 2508.32, "total_tokens": 835008} +{"current_steps": 1445, "total_steps": 134280, "loss": 0.7713, "lr": 5.37682454572535e-06, "epoch": 0.21522192433720583, "percentage": 1.08, "elapsed_time": "0:05:33", "remaining_time": "8:31:39", "throughput": 2508.16, "total_tokens": 837600} +{"current_steps": 1450, "total_steps": 134280, "loss": 0.7443, "lr": 5.39544235924933e-06, "epoch": 0.21596663687816503, "percentage": 1.08, "elapsed_time": "0:05:35", "remaining_time": "8:31:36", "throughput": 2508.26, "total_tokens": 840480} +{"current_steps": 1455, "total_steps": 134280, "loss": 0.6932, "lr": 5.414060172773309e-06, "epoch": 0.2167113494191242, "percentage": 1.08, "elapsed_time": "0:05:36", "remaining_time": "8:31:33", "throughput": 2508.49, "total_tokens": 843424} +{"current_steps": 1460, "total_steps": 134280, "loss": 0.6279, "lr": 5.43267798629729e-06, "epoch": 0.2174560619600834, "percentage": 1.09, "elapsed_time": "0:05:37", "remaining_time": "8:31:30", "throughput": 2508.52, "total_tokens": 846272} +{"current_steps": 1465, "total_steps": 134280, "loss": 0.7262, "lr": 5.451295799821269e-06, "epoch": 0.2182007745010426, "percentage": 1.09, "elapsed_time": "0:05:38", "remaining_time": "8:31:30", "throughput": 2508.52, "total_tokens": 849216} +{"current_steps": 1470, "total_steps": 134280, "loss": 0.8108, "lr": 5.469913613345249e-06, "epoch": 0.21894548704200179, "percentage": 1.09, "elapsed_time": "0:05:39", "remaining_time": "8:31:25", "throughput": 2508.6, "total_tokens": 852032} +{"current_steps": 1475, "total_steps": 134280, "loss": 0.6887, "lr": 5.488531426869229e-06, "epoch": 0.219690199582961, "percentage": 1.1, "elapsed_time": "0:05:40", "remaining_time": "8:31:25", "throughput": 2508.97, "total_tokens": 855072} +{"current_steps": 1480, "total_steps": 134280, "loss": 0.7446, "lr": 5.507149240393209e-06, "epoch": 0.22043491212392016, "percentage": 1.1, "elapsed_time": "0:05:41", "remaining_time": "8:31:20", "throughput": 2508.66, "total_tokens": 857760} +{"current_steps": 1485, "total_steps": 134280, "loss": 0.8068, "lr": 5.525767053917189e-06, "epoch": 0.22117962466487937, "percentage": 1.11, "elapsed_time": "0:05:43", "remaining_time": "8:31:24", "throughput": 2509.0, "total_tokens": 860928} +{"current_steps": 1490, "total_steps": 134280, "loss": 0.7454, "lr": 5.544384867441168e-06, "epoch": 0.22192433720583854, "percentage": 1.11, "elapsed_time": "0:05:44", "remaining_time": "8:31:27", "throughput": 2509.26, "total_tokens": 864032} +{"current_steps": 1495, "total_steps": 134280, "loss": 0.9631, "lr": 5.563002680965148e-06, "epoch": 0.22266904974679774, "percentage": 1.11, "elapsed_time": "0:05:45", "remaining_time": "8:31:28", "throughput": 2509.44, "total_tokens": 867040} +{"current_steps": 1500, "total_steps": 134280, "loss": 0.7065, "lr": 5.581620494489128e-06, "epoch": 0.22341376228775692, "percentage": 1.12, "elapsed_time": "0:05:46", "remaining_time": "8:31:32", "throughput": 2509.27, "total_tokens": 870048} +{"current_steps": 1505, "total_steps": 134280, "loss": 0.7803, "lr": 5.600238308013108e-06, "epoch": 0.22415847482871612, "percentage": 1.12, "elapsed_time": "0:05:48", "remaining_time": "8:31:47", "throughput": 2509.91, "total_tokens": 873632} +{"current_steps": 1510, "total_steps": 134280, "loss": 0.7369, "lr": 5.618856121537087e-06, "epoch": 0.2249031873696753, "percentage": 1.12, "elapsed_time": "0:05:49", "remaining_time": "8:31:47", "throughput": 2510.03, "total_tokens": 876608} +{"current_steps": 1515, "total_steps": 134280, "loss": 0.7941, "lr": 5.637473935061067e-06, "epoch": 0.2256478999106345, "percentage": 1.13, "elapsed_time": "0:05:50", "remaining_time": "8:31:44", "throughput": 2509.94, "total_tokens": 879424} +{"current_steps": 1520, "total_steps": 134280, "loss": 0.6208, "lr": 5.656091748585047e-06, "epoch": 0.22639261245159367, "percentage": 1.13, "elapsed_time": "0:05:51", "remaining_time": "8:31:45", "throughput": 2510.24, "total_tokens": 882496} +{"current_steps": 1525, "total_steps": 134280, "loss": 0.7128, "lr": 5.6747095621090265e-06, "epoch": 0.22713732499255287, "percentage": 1.14, "elapsed_time": "0:05:52", "remaining_time": "8:31:51", "throughput": 2510.35, "total_tokens": 885632} +{"current_steps": 1530, "total_steps": 134280, "loss": 0.5632, "lr": 5.693327375633006e-06, "epoch": 0.22788203753351208, "percentage": 1.14, "elapsed_time": "0:05:53", "remaining_time": "8:31:49", "throughput": 2510.29, "total_tokens": 888480} +{"current_steps": 1535, "total_steps": 134280, "loss": 0.6303, "lr": 5.7119451891569855e-06, "epoch": 0.22862675007447125, "percentage": 1.14, "elapsed_time": "0:05:55", "remaining_time": "8:31:46", "throughput": 2510.45, "total_tokens": 891392} +{"current_steps": 1540, "total_steps": 134280, "loss": 0.5718, "lr": 5.7305630026809654e-06, "epoch": 0.22937146261543045, "percentage": 1.15, "elapsed_time": "0:05:56", "remaining_time": "8:31:45", "throughput": 2510.55, "total_tokens": 894336} +{"current_steps": 1545, "total_steps": 134280, "loss": 0.5616, "lr": 5.749180816204945e-06, "epoch": 0.23011617515638963, "percentage": 1.15, "elapsed_time": "0:05:57", "remaining_time": "8:31:45", "throughput": 2510.59, "total_tokens": 897280} +{"current_steps": 1550, "total_steps": 134280, "loss": 0.9463, "lr": 5.767798629728925e-06, "epoch": 0.23086088769734883, "percentage": 1.15, "elapsed_time": "0:05:58", "remaining_time": "8:31:43", "throughput": 2510.67, "total_tokens": 900192} +{"current_steps": 1555, "total_steps": 134280, "loss": 0.6747, "lr": 5.786416443252904e-06, "epoch": 0.231605600238308, "percentage": 1.16, "elapsed_time": "0:05:59", "remaining_time": "8:31:45", "throughput": 2510.79, "total_tokens": 903232} +{"current_steps": 1560, "total_steps": 134280, "loss": 0.6416, "lr": 5.805034256776884e-06, "epoch": 0.2323503127792672, "percentage": 1.16, "elapsed_time": "0:06:00", "remaining_time": "8:31:41", "throughput": 2510.8, "total_tokens": 906080} +{"current_steps": 1565, "total_steps": 134280, "loss": 0.6658, "lr": 5.823652070300864e-06, "epoch": 0.23309502532022638, "percentage": 1.17, "elapsed_time": "0:06:01", "remaining_time": "8:31:37", "throughput": 2510.8, "total_tokens": 908896} +{"current_steps": 1570, "total_steps": 134280, "loss": 0.7822, "lr": 5.842269883824844e-06, "epoch": 0.2338397378611856, "percentage": 1.17, "elapsed_time": "0:06:03", "remaining_time": "8:31:37", "throughput": 2510.85, "total_tokens": 911840} +{"current_steps": 1575, "total_steps": 134280, "loss": 0.8105, "lr": 5.860887697348823e-06, "epoch": 0.23458445040214476, "percentage": 1.17, "elapsed_time": "0:06:04", "remaining_time": "8:31:39", "throughput": 2510.9, "total_tokens": 914848} +{"current_steps": 1580, "total_steps": 134280, "loss": 0.7656, "lr": 5.879505510872803e-06, "epoch": 0.23532916294310396, "percentage": 1.18, "elapsed_time": "0:06:05", "remaining_time": "8:31:38", "throughput": 2510.94, "total_tokens": 917792} +{"current_steps": 1585, "total_steps": 134280, "loss": 0.8031, "lr": 5.898123324396783e-06, "epoch": 0.23607387548406314, "percentage": 1.18, "elapsed_time": "0:06:06", "remaining_time": "8:31:33", "throughput": 2511.0, "total_tokens": 920608} +{"current_steps": 1590, "total_steps": 134280, "loss": 0.8282, "lr": 5.916741137920763e-06, "epoch": 0.23681858802502234, "percentage": 1.18, "elapsed_time": "0:06:07", "remaining_time": "8:31:35", "throughput": 2511.18, "total_tokens": 923648} +{"current_steps": 1595, "total_steps": 134280, "loss": 0.6704, "lr": 5.935358951444742e-06, "epoch": 0.23756330056598154, "percentage": 1.19, "elapsed_time": "0:06:08", "remaining_time": "8:31:35", "throughput": 2511.0, "total_tokens": 926528} +{"current_steps": 1600, "total_steps": 134280, "loss": 0.6697, "lr": 5.953976764968722e-06, "epoch": 0.23830801310694072, "percentage": 1.19, "elapsed_time": "0:06:10", "remaining_time": "8:31:29", "throughput": 2510.75, "total_tokens": 929184} +{"current_steps": 1605, "total_steps": 134280, "loss": 0.7255, "lr": 5.972594578492702e-06, "epoch": 0.23905272564789992, "percentage": 1.2, "elapsed_time": "0:06:11", "remaining_time": "8:31:21", "throughput": 2510.67, "total_tokens": 931872} +{"current_steps": 1610, "total_steps": 134280, "loss": 0.6378, "lr": 5.991212392016682e-06, "epoch": 0.2397974381888591, "percentage": 1.2, "elapsed_time": "0:06:12", "remaining_time": "8:31:18", "throughput": 2510.64, "total_tokens": 934688} +{"current_steps": 1615, "total_steps": 134280, "loss": 0.607, "lr": 6.009830205540662e-06, "epoch": 0.2405421507298183, "percentage": 1.2, "elapsed_time": "0:06:13", "remaining_time": "8:31:28", "throughput": 2510.89, "total_tokens": 938048} +{"current_steps": 1620, "total_steps": 134280, "loss": 0.813, "lr": 6.028448019064641e-06, "epoch": 0.24128686327077747, "percentage": 1.21, "elapsed_time": "0:06:14", "remaining_time": "8:31:25", "throughput": 2510.85, "total_tokens": 940864} +{"current_steps": 1625, "total_steps": 134280, "loss": 0.7278, "lr": 6.047065832588622e-06, "epoch": 0.24203157581173668, "percentage": 1.21, "elapsed_time": "0:06:15", "remaining_time": "8:31:25", "throughput": 2510.88, "total_tokens": 943808} +{"current_steps": 1630, "total_steps": 134280, "loss": 0.581, "lr": 6.065683646112601e-06, "epoch": 0.24277628835269585, "percentage": 1.21, "elapsed_time": "0:06:17", "remaining_time": "8:31:28", "throughput": 2511.25, "total_tokens": 946976} +{"current_steps": 1635, "total_steps": 134280, "loss": 0.5808, "lr": 6.084301459636581e-06, "epoch": 0.24352100089365505, "percentage": 1.22, "elapsed_time": "0:06:18", "remaining_time": "8:31:23", "throughput": 2511.03, "total_tokens": 949696} +{"current_steps": 1640, "total_steps": 134280, "loss": 0.7803, "lr": 6.10291927316056e-06, "epoch": 0.24426571343461423, "percentage": 1.22, "elapsed_time": "0:06:19", "remaining_time": "8:31:21", "throughput": 2510.84, "total_tokens": 952512} +{"current_steps": 1645, "total_steps": 134280, "loss": 0.7388, "lr": 6.1215370866845405e-06, "epoch": 0.24501042597557343, "percentage": 1.23, "elapsed_time": "0:06:20", "remaining_time": "8:31:15", "throughput": 2510.66, "total_tokens": 955200} +{"current_steps": 1650, "total_steps": 134280, "loss": 0.5768, "lr": 6.14015490020852e-06, "epoch": 0.2457551385165326, "percentage": 1.23, "elapsed_time": "0:06:21", "remaining_time": "8:31:11", "throughput": 2510.78, "total_tokens": 958048} +{"current_steps": 1655, "total_steps": 134280, "loss": 0.6266, "lr": 6.1587727137324995e-06, "epoch": 0.2464998510574918, "percentage": 1.23, "elapsed_time": "0:06:22", "remaining_time": "8:31:15", "throughput": 2510.86, "total_tokens": 961152} +{"current_steps": 1660, "total_steps": 134280, "loss": 0.6659, "lr": 6.1773905272564794e-06, "epoch": 0.247244563598451, "percentage": 1.24, "elapsed_time": "0:06:23", "remaining_time": "8:31:15", "throughput": 2510.68, "total_tokens": 964000} +{"current_steps": 1665, "total_steps": 134280, "loss": 0.8112, "lr": 6.196008340780459e-06, "epoch": 0.2479892761394102, "percentage": 1.24, "elapsed_time": "0:06:25", "remaining_time": "8:31:08", "throughput": 2510.45, "total_tokens": 966656} +{"current_steps": 1670, "total_steps": 134280, "loss": 0.8024, "lr": 6.2146261543044384e-06, "epoch": 0.2487339886803694, "percentage": 1.24, "elapsed_time": "0:06:26", "remaining_time": "8:31:11", "throughput": 2510.64, "total_tokens": 969760} +{"current_steps": 1675, "total_steps": 134280, "loss": 0.8954, "lr": 6.233243967828418e-06, "epoch": 0.24947870122132856, "percentage": 1.25, "elapsed_time": "0:06:27", "remaining_time": "8:31:09", "throughput": 2510.77, "total_tokens": 972672} +{"current_steps": 1680, "total_steps": 134280, "loss": 0.7499, "lr": 6.251861781352398e-06, "epoch": 0.25022341376228774, "percentage": 1.25, "elapsed_time": "0:06:28", "remaining_time": "8:31:07", "throughput": 2510.76, "total_tokens": 975552} +{"current_steps": 1685, "total_steps": 134280, "loss": 0.509, "lr": 6.270479594876379e-06, "epoch": 0.25096812630324694, "percentage": 1.25, "elapsed_time": "0:06:29", "remaining_time": "8:31:02", "throughput": 2510.66, "total_tokens": 978304} +{"current_steps": 1690, "total_steps": 134280, "loss": 0.608, "lr": 6.289097408400357e-06, "epoch": 0.25171283884420614, "percentage": 1.26, "elapsed_time": "0:06:30", "remaining_time": "8:30:57", "throughput": 2510.66, "total_tokens": 981088} +{"current_steps": 1695, "total_steps": 134280, "loss": 0.7005, "lr": 6.307715221924337e-06, "epoch": 0.25245755138516535, "percentage": 1.26, "elapsed_time": "0:06:31", "remaining_time": "8:30:50", "throughput": 2510.48, "total_tokens": 983712} +{"current_steps": 1700, "total_steps": 134280, "loss": 0.8175, "lr": 6.326333035448317e-06, "epoch": 0.2532022639261245, "percentage": 1.27, "elapsed_time": "0:06:33", "remaining_time": "8:30:51", "throughput": 2510.75, "total_tokens": 986784} +{"current_steps": 1705, "total_steps": 134280, "loss": 0.728, "lr": 6.344950848972298e-06, "epoch": 0.2539469764670837, "percentage": 1.27, "elapsed_time": "0:06:34", "remaining_time": "8:30:56", "throughput": 2510.95, "total_tokens": 989984} +{"current_steps": 1710, "total_steps": 134280, "loss": 0.643, "lr": 6.363568662496276e-06, "epoch": 0.2546916890080429, "percentage": 1.27, "elapsed_time": "0:06:35", "remaining_time": "8:30:56", "throughput": 2510.94, "total_tokens": 992896} +{"current_steps": 1715, "total_steps": 134280, "loss": 0.787, "lr": 6.382186476020256e-06, "epoch": 0.2554364015490021, "percentage": 1.28, "elapsed_time": "0:06:36", "remaining_time": "8:30:53", "throughput": 2510.91, "total_tokens": 995744} +{"current_steps": 1720, "total_steps": 134280, "loss": 0.7367, "lr": 6.400804289544236e-06, "epoch": 0.25618111408996125, "percentage": 1.28, "elapsed_time": "0:06:37", "remaining_time": "8:30:54", "throughput": 2510.97, "total_tokens": 998752} +{"current_steps": 1725, "total_steps": 134280, "loss": 0.8213, "lr": 6.419422103068217e-06, "epoch": 0.25692582663092045, "percentage": 1.28, "elapsed_time": "0:06:38", "remaining_time": "8:30:56", "throughput": 2511.08, "total_tokens": 1001792} +{"current_steps": 1730, "total_steps": 134280, "loss": 0.7455, "lr": 6.438039916592195e-06, "epoch": 0.25767053917187965, "percentage": 1.29, "elapsed_time": "0:06:40", "remaining_time": "8:30:53", "throughput": 2511.05, "total_tokens": 1004608} +{"current_steps": 1735, "total_steps": 134280, "loss": 0.6873, "lr": 6.456657730116175e-06, "epoch": 0.25841525171283886, "percentage": 1.29, "elapsed_time": "0:06:41", "remaining_time": "8:30:45", "throughput": 2510.85, "total_tokens": 1007232} +{"current_steps": 1740, "total_steps": 134280, "loss": 0.7692, "lr": 6.475275543640155e-06, "epoch": 0.25915996425379806, "percentage": 1.3, "elapsed_time": "0:06:42", "remaining_time": "8:30:48", "throughput": 2510.91, "total_tokens": 1010272} +{"current_steps": 1745, "total_steps": 134280, "loss": 0.7252, "lr": 6.493893357164136e-06, "epoch": 0.2599046767947572, "percentage": 1.3, "elapsed_time": "0:06:43", "remaining_time": "8:30:45", "throughput": 2510.66, "total_tokens": 1013024} +{"current_steps": 1750, "total_steps": 134280, "loss": 0.5701, "lr": 6.5125111706881156e-06, "epoch": 0.2606493893357164, "percentage": 1.3, "elapsed_time": "0:06:44", "remaining_time": "8:30:53", "throughput": 2510.73, "total_tokens": 1016256} +{"current_steps": 1755, "total_steps": 134280, "loss": 0.6309, "lr": 6.531128984212094e-06, "epoch": 0.2613941018766756, "percentage": 1.31, "elapsed_time": "0:06:45", "remaining_time": "8:30:53", "throughput": 2510.77, "total_tokens": 1019200} +{"current_steps": 1760, "total_steps": 134280, "loss": 0.812, "lr": 6.549746797736074e-06, "epoch": 0.2621388144176348, "percentage": 1.31, "elapsed_time": "0:06:47", "remaining_time": "8:30:47", "throughput": 2510.6, "total_tokens": 1021888} +{"current_steps": 1765, "total_steps": 134280, "loss": 0.8029, "lr": 6.5683646112600545e-06, "epoch": 0.26288352695859396, "percentage": 1.31, "elapsed_time": "0:06:48", "remaining_time": "8:30:49", "throughput": 2510.55, "total_tokens": 1024864} +{"current_steps": 1770, "total_steps": 134280, "loss": 0.5549, "lr": 6.5869824247840344e-06, "epoch": 0.26362823949955316, "percentage": 1.32, "elapsed_time": "0:06:49", "remaining_time": "8:30:44", "throughput": 2510.56, "total_tokens": 1027648} +{"current_steps": 1775, "total_steps": 134280, "loss": 0.8032, "lr": 6.605600238308013e-06, "epoch": 0.26437295204051237, "percentage": 1.32, "elapsed_time": "0:06:50", "remaining_time": "8:30:41", "throughput": 2510.53, "total_tokens": 1030496} +{"current_steps": 1780, "total_steps": 134280, "loss": 0.5858, "lr": 6.624218051831993e-06, "epoch": 0.26511766458147157, "percentage": 1.33, "elapsed_time": "0:06:51", "remaining_time": "8:30:46", "throughput": 2510.82, "total_tokens": 1033728} +{"current_steps": 1785, "total_steps": 134280, "loss": 0.8017, "lr": 6.642835865355973e-06, "epoch": 0.2658623771224307, "percentage": 1.33, "elapsed_time": "0:06:52", "remaining_time": "8:30:45", "throughput": 2510.95, "total_tokens": 1036672} +{"current_steps": 1790, "total_steps": 134280, "loss": 0.7291, "lr": 6.661453678879953e-06, "epoch": 0.2666070896633899, "percentage": 1.33, "elapsed_time": "0:06:54", "remaining_time": "8:30:49", "throughput": 2511.09, "total_tokens": 1039808} +{"current_steps": 1795, "total_steps": 134280, "loss": 0.6712, "lr": 6.6800714924039315e-06, "epoch": 0.2673518022043491, "percentage": 1.34, "elapsed_time": "0:06:55", "remaining_time": "8:30:48", "throughput": 2511.12, "total_tokens": 1042720} +{"current_steps": 1800, "total_steps": 134280, "loss": 0.6852, "lr": 6.6986893059279114e-06, "epoch": 0.2680965147453083, "percentage": 1.34, "elapsed_time": "0:06:56", "remaining_time": "8:30:45", "throughput": 2511.04, "total_tokens": 1045536} +{"current_steps": 1805, "total_steps": 134280, "loss": 0.7103, "lr": 6.717307119451892e-06, "epoch": 0.2688412272862675, "percentage": 1.34, "elapsed_time": "0:06:57", "remaining_time": "8:30:41", "throughput": 2511.16, "total_tokens": 1048384} +{"current_steps": 1810, "total_steps": 134280, "loss": 0.8036, "lr": 6.735924932975872e-06, "epoch": 0.2695859398272267, "percentage": 1.35, "elapsed_time": "0:06:58", "remaining_time": "8:30:36", "throughput": 2511.16, "total_tokens": 1051168} +{"current_steps": 1815, "total_steps": 134280, "loss": 0.6791, "lr": 6.754542746499852e-06, "epoch": 0.2703306523681859, "percentage": 1.35, "elapsed_time": "0:06:59", "remaining_time": "8:30:31", "throughput": 2511.17, "total_tokens": 1053952} +{"current_steps": 1820, "total_steps": 134280, "loss": 0.6089, "lr": 6.77316056002383e-06, "epoch": 0.2710753649091451, "percentage": 1.36, "elapsed_time": "0:07:00", "remaining_time": "8:30:34", "throughput": 2511.32, "total_tokens": 1057056} +{"current_steps": 1825, "total_steps": 134280, "loss": 0.6824, "lr": 6.791778373547811e-06, "epoch": 0.2718200774501043, "percentage": 1.36, "elapsed_time": "0:07:02", "remaining_time": "8:30:31", "throughput": 2511.44, "total_tokens": 1059968} +{"current_steps": 1830, "total_steps": 134280, "loss": 0.7679, "lr": 6.810396187071791e-06, "epoch": 0.2725647899910634, "percentage": 1.36, "elapsed_time": "0:07:03", "remaining_time": "8:30:35", "throughput": 2511.37, "total_tokens": 1063008} +{"current_steps": 1835, "total_steps": 134280, "loss": 0.6196, "lr": 6.829014000595771e-06, "epoch": 0.27330950253202263, "percentage": 1.37, "elapsed_time": "0:07:04", "remaining_time": "8:30:31", "throughput": 2511.18, "total_tokens": 1065728} +{"current_steps": 1840, "total_steps": 134280, "loss": 0.6019, "lr": 6.847631814119749e-06, "epoch": 0.27405421507298183, "percentage": 1.37, "elapsed_time": "0:07:05", "remaining_time": "8:30:28", "throughput": 2511.25, "total_tokens": 1068608} +{"current_steps": 1845, "total_steps": 134280, "loss": 0.5993, "lr": 6.86624962764373e-06, "epoch": 0.27479892761394104, "percentage": 1.37, "elapsed_time": "0:07:06", "remaining_time": "8:30:28", "throughput": 2511.29, "total_tokens": 1071552} +{"current_steps": 1850, "total_steps": 134280, "loss": 0.6483, "lr": 6.88486744116771e-06, "epoch": 0.2755436401549002, "percentage": 1.38, "elapsed_time": "0:07:07", "remaining_time": "8:30:25", "throughput": 2511.26, "total_tokens": 1074400} +{"current_steps": 1855, "total_steps": 134280, "loss": 0.5849, "lr": 6.90348525469169e-06, "epoch": 0.2762883526958594, "percentage": 1.38, "elapsed_time": "0:07:09", "remaining_time": "8:30:29", "throughput": 2511.2, "total_tokens": 1077440} +{"current_steps": 1860, "total_steps": 134280, "loss": 0.7938, "lr": 6.922103068215669e-06, "epoch": 0.2770330652368186, "percentage": 1.39, "elapsed_time": "0:07:10", "remaining_time": "8:30:33", "throughput": 2511.33, "total_tokens": 1080576} +{"current_steps": 1865, "total_steps": 134280, "loss": 0.6256, "lr": 6.940720881739649e-06, "epoch": 0.2777777777777778, "percentage": 1.39, "elapsed_time": "0:07:11", "remaining_time": "8:30:34", "throughput": 2511.44, "total_tokens": 1083616} +{"current_steps": 1870, "total_steps": 134280, "loss": 0.8134, "lr": 6.959338695263629e-06, "epoch": 0.278522490318737, "percentage": 1.39, "elapsed_time": "0:07:12", "remaining_time": "8:30:36", "throughput": 2511.43, "total_tokens": 1086624} +{"current_steps": 1875, "total_steps": 134280, "loss": 0.7763, "lr": 6.977956508787609e-06, "epoch": 0.27926720285969614, "percentage": 1.4, "elapsed_time": "0:07:13", "remaining_time": "8:30:36", "throughput": 2511.57, "total_tokens": 1089632} +{"current_steps": 1880, "total_steps": 134280, "loss": 0.6827, "lr": 6.9965743223115886e-06, "epoch": 0.28001191540065534, "percentage": 1.4, "elapsed_time": "0:07:14", "remaining_time": "8:30:33", "throughput": 2511.63, "total_tokens": 1092512} +{"current_steps": 1885, "total_steps": 134280, "loss": 0.6614, "lr": 7.015192135835568e-06, "epoch": 0.28075662794161454, "percentage": 1.4, "elapsed_time": "0:07:16", "remaining_time": "8:30:33", "throughput": 2511.71, "total_tokens": 1095488} +{"current_steps": 1890, "total_steps": 134280, "loss": 0.7045, "lr": 7.033809949359548e-06, "epoch": 0.28150134048257375, "percentage": 1.41, "elapsed_time": "0:07:17", "remaining_time": "8:30:27", "throughput": 2511.65, "total_tokens": 1098176} +{"current_steps": 1895, "total_steps": 134280, "loss": 0.6022, "lr": 7.0524277628835275e-06, "epoch": 0.2822460530235329, "percentage": 1.41, "elapsed_time": "0:07:18", "remaining_time": "8:30:29", "throughput": 2511.85, "total_tokens": 1101312} +{"current_steps": 1900, "total_steps": 134280, "loss": 0.633, "lr": 7.0710455764075074e-06, "epoch": 0.2829907655644921, "percentage": 1.41, "elapsed_time": "0:07:19", "remaining_time": "8:30:33", "throughput": 2512.03, "total_tokens": 1104480} +{"current_steps": 1905, "total_steps": 134280, "loss": 0.669, "lr": 7.0896633899314865e-06, "epoch": 0.2837354781054513, "percentage": 1.42, "elapsed_time": "0:07:20", "remaining_time": "8:30:32", "throughput": 2512.15, "total_tokens": 1107424} +{"current_steps": 1910, "total_steps": 134280, "loss": 0.6622, "lr": 7.1082812034554664e-06, "epoch": 0.2844801906464105, "percentage": 1.42, "elapsed_time": "0:07:21", "remaining_time": "8:30:27", "throughput": 2511.99, "total_tokens": 1110112} +{"current_steps": 1915, "total_steps": 134280, "loss": 0.9668, "lr": 7.126899016979446e-06, "epoch": 0.28522490318736965, "percentage": 1.43, "elapsed_time": "0:07:23", "remaining_time": "8:30:27", "throughput": 2512.12, "total_tokens": 1113120} +{"current_steps": 1920, "total_steps": 134280, "loss": 0.834, "lr": 7.145516830503426e-06, "epoch": 0.28596961572832885, "percentage": 1.43, "elapsed_time": "0:07:24", "remaining_time": "8:30:23", "throughput": 2512.04, "total_tokens": 1115904} +{"current_steps": 1925, "total_steps": 134280, "loss": 0.5743, "lr": 7.164134644027405e-06, "epoch": 0.28671432826928805, "percentage": 1.43, "elapsed_time": "0:07:25", "remaining_time": "8:30:23", "throughput": 2512.12, "total_tokens": 1118880} +{"current_steps": 1930, "total_steps": 134280, "loss": 0.7336, "lr": 7.182752457551385e-06, "epoch": 0.28745904081024726, "percentage": 1.44, "elapsed_time": "0:07:26", "remaining_time": "8:30:24", "throughput": 2512.3, "total_tokens": 1121952} +{"current_steps": 1935, "total_steps": 134280, "loss": 0.5489, "lr": 7.201370271075365e-06, "epoch": 0.28820375335120646, "percentage": 1.44, "elapsed_time": "0:07:27", "remaining_time": "8:30:20", "throughput": 2512.17, "total_tokens": 1124704} +{"current_steps": 1940, "total_steps": 134280, "loss": 0.6982, "lr": 7.219988084599345e-06, "epoch": 0.2889484658921656, "percentage": 1.44, "elapsed_time": "0:07:28", "remaining_time": "8:30:15", "throughput": 2512.12, "total_tokens": 1127456} +{"current_steps": 1945, "total_steps": 134280, "loss": 0.7101, "lr": 7.238605898123325e-06, "epoch": 0.2896931784331248, "percentage": 1.45, "elapsed_time": "0:07:30", "remaining_time": "8:30:25", "throughput": 2512.2, "total_tokens": 1130784} +{"current_steps": 1950, "total_steps": 134280, "loss": 0.6641, "lr": 7.257223711647304e-06, "epoch": 0.290437890974084, "percentage": 1.45, "elapsed_time": "0:07:31", "remaining_time": "8:30:24", "throughput": 2512.36, "total_tokens": 1133760} +{"current_steps": 1955, "total_steps": 134280, "loss": 0.7232, "lr": 7.275841525171284e-06, "epoch": 0.2911826035150432, "percentage": 1.46, "elapsed_time": "0:07:32", "remaining_time": "8:30:21", "throughput": 2512.43, "total_tokens": 1136640} +{"current_steps": 1960, "total_steps": 134280, "loss": 0.6186, "lr": 7.294459338695264e-06, "epoch": 0.29192731605600236, "percentage": 1.46, "elapsed_time": "0:07:33", "remaining_time": "8:30:23", "throughput": 2512.57, "total_tokens": 1139744} +{"current_steps": 1965, "total_steps": 134280, "loss": 0.6067, "lr": 7.313077152219244e-06, "epoch": 0.29267202859696156, "percentage": 1.46, "elapsed_time": "0:07:34", "remaining_time": "8:30:22", "throughput": 2512.65, "total_tokens": 1142688} +{"current_steps": 1970, "total_steps": 134280, "loss": 0.7507, "lr": 7.331694965743223e-06, "epoch": 0.29341674113792077, "percentage": 1.47, "elapsed_time": "0:07:36", "remaining_time": "8:30:27", "throughput": 2512.68, "total_tokens": 1145824} +{"current_steps": 1975, "total_steps": 134280, "loss": 0.671, "lr": 7.350312779267203e-06, "epoch": 0.29416145367887997, "percentage": 1.47, "elapsed_time": "0:07:37", "remaining_time": "8:30:23", "throughput": 2512.49, "total_tokens": 1148544} +{"current_steps": 1980, "total_steps": 134280, "loss": 0.7425, "lr": 7.368930592791183e-06, "epoch": 0.2949061662198391, "percentage": 1.47, "elapsed_time": "0:07:38", "remaining_time": "8:30:19", "throughput": 2512.41, "total_tokens": 1151328} +{"current_steps": 1985, "total_steps": 134280, "loss": 0.5964, "lr": 7.387548406315163e-06, "epoch": 0.2956508787607983, "percentage": 1.48, "elapsed_time": "0:07:39", "remaining_time": "8:30:12", "throughput": 2512.33, "total_tokens": 1153952} +{"current_steps": 1990, "total_steps": 134280, "loss": 0.6658, "lr": 7.406166219839142e-06, "epoch": 0.2963955913017575, "percentage": 1.48, "elapsed_time": "0:07:40", "remaining_time": "8:30:09", "throughput": 2512.3, "total_tokens": 1156800} +{"current_steps": 1995, "total_steps": 134280, "loss": 0.6409, "lr": 7.424784033363122e-06, "epoch": 0.2971403038427167, "percentage": 1.49, "elapsed_time": "0:07:41", "remaining_time": "8:30:10", "throughput": 2512.34, "total_tokens": 1159808} +{"current_steps": 2000, "total_steps": 134280, "loss": 0.6461, "lr": 7.443401846887102e-06, "epoch": 0.2978850163836759, "percentage": 1.49, "elapsed_time": "0:07:42", "remaining_time": "8:30:12", "throughput": 2512.39, "total_tokens": 1162848} +{"current_steps": 2005, "total_steps": 134280, "loss": 0.7766, "lr": 7.462019660411082e-06, "epoch": 0.2986297289246351, "percentage": 1.49, "elapsed_time": "0:07:44", "remaining_time": "8:30:18", "throughput": 2512.79, "total_tokens": 1166208} +{"current_steps": 2010, "total_steps": 134280, "loss": 0.9582, "lr": 7.480637473935062e-06, "epoch": 0.2993744414655943, "percentage": 1.5, "elapsed_time": "0:07:45", "remaining_time": "8:30:13", "throughput": 2512.69, "total_tokens": 1168928} +{"current_steps": 2015, "total_steps": 134280, "loss": 0.6962, "lr": 7.499255287459041e-06, "epoch": 0.3001191540065535, "percentage": 1.5, "elapsed_time": "0:07:46", "remaining_time": "8:30:11", "throughput": 2512.51, "total_tokens": 1171712} +{"current_steps": 2020, "total_steps": 134280, "loss": 0.5611, "lr": 7.517873100983021e-06, "epoch": 0.3008638665475127, "percentage": 1.5, "elapsed_time": "0:07:47", "remaining_time": "8:30:07", "throughput": 2512.19, "total_tokens": 1174368} +{"current_steps": 2025, "total_steps": 134280, "loss": 0.5905, "lr": 7.5364909145070005e-06, "epoch": 0.30160857908847183, "percentage": 1.51, "elapsed_time": "0:07:48", "remaining_time": "8:30:04", "throughput": 2512.15, "total_tokens": 1177184} +{"current_steps": 2030, "total_steps": 134280, "loss": 0.7516, "lr": 7.555108728030981e-06, "epoch": 0.30235329162943103, "percentage": 1.51, "elapsed_time": "0:07:49", "remaining_time": "8:30:00", "throughput": 2511.93, "total_tokens": 1179872} +{"current_steps": 2035, "total_steps": 134280, "loss": 0.8054, "lr": 7.5737265415549595e-06, "epoch": 0.30309800417039023, "percentage": 1.52, "elapsed_time": "0:07:50", "remaining_time": "8:29:53", "throughput": 2511.72, "total_tokens": 1182464} +{"current_steps": 2040, "total_steps": 134280, "loss": 0.8172, "lr": 7.5923443550789394e-06, "epoch": 0.30384271671134944, "percentage": 1.52, "elapsed_time": "0:07:51", "remaining_time": "8:29:56", "throughput": 2511.96, "total_tokens": 1185632} +{"current_steps": 2045, "total_steps": 134280, "loss": 0.65, "lr": 7.610962168602919e-06, "epoch": 0.3045874292523086, "percentage": 1.52, "elapsed_time": "0:07:53", "remaining_time": "8:29:52", "throughput": 2511.95, "total_tokens": 1188416} +{"current_steps": 2050, "total_steps": 134280, "loss": 0.7271, "lr": 7.6295799821269e-06, "epoch": 0.3053321417932678, "percentage": 1.53, "elapsed_time": "0:07:54", "remaining_time": "8:29:58", "throughput": 2511.99, "total_tokens": 1191648} +{"current_steps": 2055, "total_steps": 134280, "loss": 0.6954, "lr": 7.64819779565088e-06, "epoch": 0.306076854334227, "percentage": 1.53, "elapsed_time": "0:07:55", "remaining_time": "8:29:56", "throughput": 2511.87, "total_tokens": 1194432} +{"current_steps": 2060, "total_steps": 134280, "loss": 0.663, "lr": 7.666815609174859e-06, "epoch": 0.3068215668751862, "percentage": 1.53, "elapsed_time": "0:07:56", "remaining_time": "8:29:52", "throughput": 2511.92, "total_tokens": 1197248} +{"current_steps": 2065, "total_steps": 134280, "loss": 0.7533, "lr": 7.685433422698839e-06, "epoch": 0.3075662794161454, "percentage": 1.54, "elapsed_time": "0:07:57", "remaining_time": "8:29:53", "throughput": 2511.96, "total_tokens": 1200256} +{"current_steps": 2070, "total_steps": 134280, "loss": 0.765, "lr": 7.704051236222819e-06, "epoch": 0.30831099195710454, "percentage": 1.54, "elapsed_time": "0:07:58", "remaining_time": "8:29:48", "throughput": 2511.95, "total_tokens": 1203040} +{"current_steps": 2075, "total_steps": 134280, "loss": 0.7001, "lr": 7.722669049746799e-06, "epoch": 0.30905570449806374, "percentage": 1.55, "elapsed_time": "0:08:00", "remaining_time": "8:29:49", "throughput": 2512.05, "total_tokens": 1206080} +{"current_steps": 2080, "total_steps": 134280, "loss": 0.6192, "lr": 7.741286863270777e-06, "epoch": 0.30980041703902295, "percentage": 1.55, "elapsed_time": "0:08:01", "remaining_time": "8:29:42", "throughput": 2511.98, "total_tokens": 1208704} +{"current_steps": 2085, "total_steps": 134280, "loss": 0.6325, "lr": 7.759904676794757e-06, "epoch": 0.31054512957998215, "percentage": 1.55, "elapsed_time": "0:08:02", "remaining_time": "8:29:38", "throughput": 2511.84, "total_tokens": 1211424} +{"current_steps": 2090, "total_steps": 134280, "loss": 0.5324, "lr": 7.778522490318737e-06, "epoch": 0.3112898421209413, "percentage": 1.56, "elapsed_time": "0:08:03", "remaining_time": "8:29:37", "throughput": 2511.73, "total_tokens": 1214272} +{"current_steps": 2095, "total_steps": 134280, "loss": 0.7774, "lr": 7.797140303842717e-06, "epoch": 0.3120345546619005, "percentage": 1.56, "elapsed_time": "0:08:04", "remaining_time": "8:29:36", "throughput": 2511.86, "total_tokens": 1217280} +{"current_steps": 2100, "total_steps": 134280, "loss": 0.6934, "lr": 7.815758117366697e-06, "epoch": 0.3127792672028597, "percentage": 1.56, "elapsed_time": "0:08:05", "remaining_time": "8:29:33", "throughput": 2511.78, "total_tokens": 1220064} +{"current_steps": 2105, "total_steps": 134280, "loss": 0.553, "lr": 7.834375930890677e-06, "epoch": 0.3135239797438189, "percentage": 1.57, "elapsed_time": "0:08:06", "remaining_time": "8:29:30", "throughput": 2511.7, "total_tokens": 1222848} +{"current_steps": 2110, "total_steps": 134280, "loss": 0.6961, "lr": 7.852993744414657e-06, "epoch": 0.31426869228477805, "percentage": 1.57, "elapsed_time": "0:08:08", "remaining_time": "8:29:30", "throughput": 2511.6, "total_tokens": 1225760} +{"current_steps": 2115, "total_steps": 134280, "loss": 0.7146, "lr": 7.871611557938637e-06, "epoch": 0.31501340482573725, "percentage": 1.58, "elapsed_time": "0:08:09", "remaining_time": "8:29:32", "throughput": 2511.74, "total_tokens": 1228864} +{"current_steps": 2120, "total_steps": 134280, "loss": 0.6969, "lr": 7.890229371462615e-06, "epoch": 0.31575811736669646, "percentage": 1.58, "elapsed_time": "0:08:10", "remaining_time": "8:29:30", "throughput": 2511.76, "total_tokens": 1231712} +{"current_steps": 2125, "total_steps": 134280, "loss": 0.615, "lr": 7.908847184986595e-06, "epoch": 0.31650282990765566, "percentage": 1.58, "elapsed_time": "0:08:11", "remaining_time": "8:29:31", "throughput": 2511.76, "total_tokens": 1234720} +{"current_steps": 2130, "total_steps": 134280, "loss": 0.6922, "lr": 7.927464998510575e-06, "epoch": 0.31724754244861486, "percentage": 1.59, "elapsed_time": "0:08:12", "remaining_time": "8:29:28", "throughput": 2511.63, "total_tokens": 1237504} +{"current_steps": 2135, "total_steps": 134280, "loss": 0.7255, "lr": 7.946082812034555e-06, "epoch": 0.317992254989574, "percentage": 1.59, "elapsed_time": "0:08:13", "remaining_time": "8:29:24", "throughput": 2511.57, "total_tokens": 1240256} +{"current_steps": 2140, "total_steps": 134280, "loss": 0.7943, "lr": 7.964700625558536e-06, "epoch": 0.3187369675305332, "percentage": 1.59, "elapsed_time": "0:08:15", "remaining_time": "8:29:26", "throughput": 2511.57, "total_tokens": 1243264} +{"current_steps": 2145, "total_steps": 134280, "loss": 0.7047, "lr": 7.983318439082515e-06, "epoch": 0.3194816800714924, "percentage": 1.6, "elapsed_time": "0:08:16", "remaining_time": "8:29:26", "throughput": 2511.72, "total_tokens": 1246304} +{"current_steps": 2150, "total_steps": 134280, "loss": 0.7241, "lr": 8.001936252606494e-06, "epoch": 0.3202263926124516, "percentage": 1.6, "elapsed_time": "0:08:17", "remaining_time": "8:29:23", "throughput": 2511.78, "total_tokens": 1249184} +{"current_steps": 2155, "total_steps": 134280, "loss": 0.7714, "lr": 8.020554066130474e-06, "epoch": 0.32097110515341076, "percentage": 1.6, "elapsed_time": "0:08:18", "remaining_time": "8:29:21", "throughput": 2511.84, "total_tokens": 1252064} +{"current_steps": 2160, "total_steps": 134280, "loss": 0.6725, "lr": 8.039171879654454e-06, "epoch": 0.32171581769436997, "percentage": 1.61, "elapsed_time": "0:08:19", "remaining_time": "8:29:24", "throughput": 2511.95, "total_tokens": 1255200} +{"current_steps": 2165, "total_steps": 134280, "loss": 0.6715, "lr": 8.057789693178433e-06, "epoch": 0.32246053023532917, "percentage": 1.61, "elapsed_time": "0:08:20", "remaining_time": "8:29:21", "throughput": 2511.97, "total_tokens": 1258048} +{"current_steps": 2170, "total_steps": 134280, "loss": 0.6373, "lr": 8.076407506702412e-06, "epoch": 0.32320524277628837, "percentage": 1.62, "elapsed_time": "0:08:21", "remaining_time": "8:29:20", "throughput": 2512.09, "total_tokens": 1261024} +{"current_steps": 2175, "total_steps": 134280, "loss": 0.6775, "lr": 8.095025320226392e-06, "epoch": 0.3239499553172475, "percentage": 1.62, "elapsed_time": "0:08:23", "remaining_time": "8:29:18", "throughput": 2512.1, "total_tokens": 1263872} +{"current_steps": 2180, "total_steps": 134280, "loss": 0.6783, "lr": 8.113643133750374e-06, "epoch": 0.3246946678582067, "percentage": 1.62, "elapsed_time": "0:08:24", "remaining_time": "8:29:21", "throughput": 2512.03, "total_tokens": 1266912} +{"current_steps": 2185, "total_steps": 134280, "loss": 0.6958, "lr": 8.132260947274352e-06, "epoch": 0.3254393803991659, "percentage": 1.63, "elapsed_time": "0:08:25", "remaining_time": "8:29:18", "throughput": 2512.0, "total_tokens": 1269728} +{"current_steps": 2190, "total_steps": 134280, "loss": 0.6768, "lr": 8.150878760798332e-06, "epoch": 0.3261840929401251, "percentage": 1.63, "elapsed_time": "0:08:26", "remaining_time": "8:29:13", "throughput": 2511.87, "total_tokens": 1272416} +{"current_steps": 2195, "total_steps": 134280, "loss": 0.7732, "lr": 8.169496574322312e-06, "epoch": 0.32692880548108433, "percentage": 1.63, "elapsed_time": "0:08:27", "remaining_time": "8:29:17", "throughput": 2511.9, "total_tokens": 1275552} +{"current_steps": 2200, "total_steps": 134280, "loss": 0.6619, "lr": 8.188114387846292e-06, "epoch": 0.3276735180220435, "percentage": 1.64, "elapsed_time": "0:08:29", "remaining_time": "8:29:20", "throughput": 2512.09, "total_tokens": 1278752} +{"current_steps": 2205, "total_steps": 134280, "loss": 0.8571, "lr": 8.206732201370272e-06, "epoch": 0.3284182305630027, "percentage": 1.64, "elapsed_time": "0:08:30", "remaining_time": "8:29:20", "throughput": 2512.13, "total_tokens": 1281728} +{"current_steps": 2210, "total_steps": 134280, "loss": 0.6345, "lr": 8.22535001489425e-06, "epoch": 0.3291629431039619, "percentage": 1.65, "elapsed_time": "0:08:31", "remaining_time": "8:29:19", "throughput": 2512.06, "total_tokens": 1284608} +{"current_steps": 2215, "total_steps": 134280, "loss": 0.6281, "lr": 8.24396782841823e-06, "epoch": 0.3299076556449211, "percentage": 1.65, "elapsed_time": "0:08:32", "remaining_time": "8:29:20", "throughput": 2512.18, "total_tokens": 1287648} +{"current_steps": 2220, "total_steps": 134280, "loss": 0.6718, "lr": 8.262585641942212e-06, "epoch": 0.33065236818588023, "percentage": 1.65, "elapsed_time": "0:08:33", "remaining_time": "8:29:17", "throughput": 2512.19, "total_tokens": 1290496} +{"current_steps": 2225, "total_steps": 134280, "loss": 0.4959, "lr": 8.281203455466192e-06, "epoch": 0.33139708072683943, "percentage": 1.66, "elapsed_time": "0:08:34", "remaining_time": "8:29:15", "throughput": 2512.17, "total_tokens": 1293344} +{"current_steps": 2230, "total_steps": 134280, "loss": 0.6333, "lr": 8.29982126899017e-06, "epoch": 0.33214179326779864, "percentage": 1.66, "elapsed_time": "0:08:35", "remaining_time": "8:29:12", "throughput": 2512.18, "total_tokens": 1296192} +{"current_steps": 2235, "total_steps": 134280, "loss": 0.7225, "lr": 8.31843908251415e-06, "epoch": 0.33288650580875784, "percentage": 1.66, "elapsed_time": "0:08:37", "remaining_time": "8:29:07", "throughput": 2512.01, "total_tokens": 1298848} +{"current_steps": 2240, "total_steps": 134280, "loss": 0.8125, "lr": 8.33705689603813e-06, "epoch": 0.333631218349717, "percentage": 1.67, "elapsed_time": "0:08:38", "remaining_time": "8:29:04", "throughput": 2511.8, "total_tokens": 1301536} +{"current_steps": 2245, "total_steps": 134280, "loss": 0.7063, "lr": 8.35567470956211e-06, "epoch": 0.3343759308906762, "percentage": 1.67, "elapsed_time": "0:08:39", "remaining_time": "8:29:02", "throughput": 2511.86, "total_tokens": 1304448} +{"current_steps": 2250, "total_steps": 134280, "loss": 0.6993, "lr": 8.374292523086088e-06, "epoch": 0.3351206434316354, "percentage": 1.68, "elapsed_time": "0:08:40", "remaining_time": "8:29:00", "throughput": 2511.84, "total_tokens": 1307328} +{"current_steps": 2255, "total_steps": 134280, "loss": 0.6156, "lr": 8.392910336610068e-06, "epoch": 0.3358653559725946, "percentage": 1.68, "elapsed_time": "0:08:41", "remaining_time": "8:29:01", "throughput": 2511.94, "total_tokens": 1310368} +{"current_steps": 2260, "total_steps": 134280, "loss": 0.7141, "lr": 8.41152815013405e-06, "epoch": 0.3366100685135538, "percentage": 1.68, "elapsed_time": "0:08:42", "remaining_time": "8:28:59", "throughput": 2511.95, "total_tokens": 1313216} +{"current_steps": 2265, "total_steps": 134280, "loss": 0.6993, "lr": 8.43014596365803e-06, "epoch": 0.33735478105451294, "percentage": 1.69, "elapsed_time": "0:08:43", "remaining_time": "8:29:00", "throughput": 2512.0, "total_tokens": 1316256} +{"current_steps": 2270, "total_steps": 134280, "loss": 0.7551, "lr": 8.44876377718201e-06, "epoch": 0.33809949359547214, "percentage": 1.69, "elapsed_time": "0:08:45", "remaining_time": "8:28:56", "throughput": 2511.92, "total_tokens": 1318976} +{"current_steps": 2275, "total_steps": 134280, "loss": 0.8564, "lr": 8.467381590705988e-06, "epoch": 0.33884420613643135, "percentage": 1.69, "elapsed_time": "0:08:46", "remaining_time": "8:28:50", "throughput": 2511.82, "total_tokens": 1321632} +{"current_steps": 2280, "total_steps": 134280, "loss": 0.6687, "lr": 8.485999404229967e-06, "epoch": 0.33958891867739055, "percentage": 1.7, "elapsed_time": "0:08:47", "remaining_time": "8:28:44", "throughput": 2511.69, "total_tokens": 1324256} +{"current_steps": 2285, "total_steps": 134280, "loss": 0.6858, "lr": 8.504617217753947e-06, "epoch": 0.3403336312183497, "percentage": 1.7, "elapsed_time": "0:08:48", "remaining_time": "8:28:40", "throughput": 2511.57, "total_tokens": 1327008} +{"current_steps": 2290, "total_steps": 134280, "loss": 0.7577, "lr": 8.523235031277927e-06, "epoch": 0.3410783437593089, "percentage": 1.71, "elapsed_time": "0:08:49", "remaining_time": "8:28:40", "throughput": 2511.73, "total_tokens": 1330016} +{"current_steps": 2295, "total_steps": 134280, "loss": 0.7116, "lr": 8.541852844801907e-06, "epoch": 0.3418230563002681, "percentage": 1.71, "elapsed_time": "0:08:50", "remaining_time": "8:28:40", "throughput": 2511.84, "total_tokens": 1333024} +{"current_steps": 2300, "total_steps": 134280, "loss": 0.6528, "lr": 8.560470658325887e-06, "epoch": 0.3425677688412273, "percentage": 1.71, "elapsed_time": "0:08:51", "remaining_time": "8:28:36", "throughput": 2511.93, "total_tokens": 1335872} +{"current_steps": 2305, "total_steps": 134280, "loss": 0.7516, "lr": 8.579088471849867e-06, "epoch": 0.34331248138218645, "percentage": 1.72, "elapsed_time": "0:08:52", "remaining_time": "8:28:31", "throughput": 2511.87, "total_tokens": 1338560} +{"current_steps": 2310, "total_steps": 134280, "loss": 0.6852, "lr": 8.597706285373847e-06, "epoch": 0.34405719392314565, "percentage": 1.72, "elapsed_time": "0:08:53", "remaining_time": "8:28:26", "throughput": 2511.75, "total_tokens": 1341248} +{"current_steps": 2315, "total_steps": 134280, "loss": 0.6583, "lr": 8.616324098897825e-06, "epoch": 0.34480190646410486, "percentage": 1.72, "elapsed_time": "0:08:55", "remaining_time": "8:28:22", "throughput": 2511.63, "total_tokens": 1343936} +{"current_steps": 2320, "total_steps": 134280, "loss": 0.6455, "lr": 8.634941912421805e-06, "epoch": 0.34554661900506406, "percentage": 1.73, "elapsed_time": "0:08:56", "remaining_time": "8:28:21", "throughput": 2511.66, "total_tokens": 1346880} +{"current_steps": 2325, "total_steps": 134280, "loss": 0.6353, "lr": 8.653559725945785e-06, "epoch": 0.34629133154602326, "percentage": 1.73, "elapsed_time": "0:08:57", "remaining_time": "8:28:20", "throughput": 2511.75, "total_tokens": 1349824} +{"current_steps": 2330, "total_steps": 134280, "loss": 0.6618, "lr": 8.672177539469765e-06, "epoch": 0.3470360440869824, "percentage": 1.74, "elapsed_time": "0:08:58", "remaining_time": "8:28:17", "throughput": 2511.64, "total_tokens": 1352576} +{"current_steps": 2335, "total_steps": 134280, "loss": 0.6884, "lr": 8.690795352993745e-06, "epoch": 0.3477807566279416, "percentage": 1.74, "elapsed_time": "0:08:59", "remaining_time": "8:28:22", "throughput": 2511.83, "total_tokens": 1355872} +{"current_steps": 2340, "total_steps": 134280, "loss": 0.6204, "lr": 8.709413166517725e-06, "epoch": 0.3485254691689008, "percentage": 1.74, "elapsed_time": "0:09:00", "remaining_time": "8:28:21", "throughput": 2511.92, "total_tokens": 1358816} +{"current_steps": 2345, "total_steps": 134280, "loss": 0.6557, "lr": 8.728030980041705e-06, "epoch": 0.34927018170986, "percentage": 1.75, "elapsed_time": "0:09:02", "remaining_time": "8:28:26", "throughput": 2512.15, "total_tokens": 1362144} +{"current_steps": 2350, "total_steps": 134280, "loss": 0.5517, "lr": 8.746648793565685e-06, "epoch": 0.35001489425081916, "percentage": 1.75, "elapsed_time": "0:09:03", "remaining_time": "8:28:27", "throughput": 2512.14, "total_tokens": 1365120} +{"current_steps": 2355, "total_steps": 134280, "loss": 0.8255, "lr": 8.765266607089665e-06, "epoch": 0.35075960679177837, "percentage": 1.75, "elapsed_time": "0:09:04", "remaining_time": "8:28:28", "throughput": 2512.26, "total_tokens": 1368192} +{"current_steps": 2360, "total_steps": 134280, "loss": 0.7346, "lr": 8.783884420613643e-06, "epoch": 0.35150431933273757, "percentage": 1.76, "elapsed_time": "0:09:05", "remaining_time": "8:28:28", "throughput": 2512.37, "total_tokens": 1371200} +{"current_steps": 2365, "total_steps": 134280, "loss": 0.6487, "lr": 8.802502234137623e-06, "epoch": 0.35224903187369677, "percentage": 1.76, "elapsed_time": "0:09:06", "remaining_time": "8:28:27", "throughput": 2512.36, "total_tokens": 1374112} +{"current_steps": 2370, "total_steps": 134280, "loss": 0.8774, "lr": 8.821120047661603e-06, "epoch": 0.3529937444146559, "percentage": 1.76, "elapsed_time": "0:09:08", "remaining_time": "8:28:20", "throughput": 2512.1, "total_tokens": 1376640} +{"current_steps": 2375, "total_steps": 134280, "loss": 0.7953, "lr": 8.839737861185583e-06, "epoch": 0.3537384569556151, "percentage": 1.77, "elapsed_time": "0:09:09", "remaining_time": "8:28:20", "throughput": 2512.13, "total_tokens": 1379616} +{"current_steps": 2380, "total_steps": 134280, "loss": 0.941, "lr": 8.858355674709563e-06, "epoch": 0.3544831694965743, "percentage": 1.77, "elapsed_time": "0:09:10", "remaining_time": "8:28:28", "throughput": 2510.99, "total_tokens": 1382304} +{"current_steps": 2385, "total_steps": 134280, "loss": 0.6749, "lr": 8.876973488233543e-06, "epoch": 0.3552278820375335, "percentage": 1.78, "elapsed_time": "0:09:11", "remaining_time": "8:28:26", "throughput": 2511.04, "total_tokens": 1385184} +{"current_steps": 2390, "total_steps": 134280, "loss": 0.6785, "lr": 8.895591301757522e-06, "epoch": 0.35597259457849273, "percentage": 1.78, "elapsed_time": "0:09:12", "remaining_time": "8:28:28", "throughput": 2511.08, "total_tokens": 1388224} +{"current_steps": 2395, "total_steps": 134280, "loss": 0.6693, "lr": 8.914209115281502e-06, "epoch": 0.3567173071194519, "percentage": 1.78, "elapsed_time": "0:09:13", "remaining_time": "8:28:24", "throughput": 2511.12, "total_tokens": 1391040} +{"current_steps": 2400, "total_steps": 134280, "loss": 0.7053, "lr": 8.93282692880548e-06, "epoch": 0.3574620196604111, "percentage": 1.79, "elapsed_time": "0:09:15", "remaining_time": "8:28:19", "throughput": 2511.15, "total_tokens": 1393792} +{"current_steps": 2405, "total_steps": 134280, "loss": 0.7499, "lr": 8.95144474232946e-06, "epoch": 0.3582067322013703, "percentage": 1.79, "elapsed_time": "0:09:16", "remaining_time": "8:28:16", "throughput": 2511.09, "total_tokens": 1396576} +{"current_steps": 2410, "total_steps": 134280, "loss": 0.7237, "lr": 8.97006255585344e-06, "epoch": 0.3589514447423295, "percentage": 1.79, "elapsed_time": "0:09:17", "remaining_time": "8:28:16", "throughput": 2511.09, "total_tokens": 1399552} +{"current_steps": 2415, "total_steps": 134280, "loss": 0.5462, "lr": 8.98868036937742e-06, "epoch": 0.35969615728328863, "percentage": 1.8, "elapsed_time": "0:09:18", "remaining_time": "8:28:13", "throughput": 2511.13, "total_tokens": 1402368} +{"current_steps": 2420, "total_steps": 134280, "loss": 0.668, "lr": 9.0072981829014e-06, "epoch": 0.36044086982424783, "percentage": 1.8, "elapsed_time": "0:09:19", "remaining_time": "8:28:14", "throughput": 2511.08, "total_tokens": 1405344} +{"current_steps": 2425, "total_steps": 134280, "loss": 0.6697, "lr": 9.02591599642538e-06, "epoch": 0.36118558236520704, "percentage": 1.81, "elapsed_time": "0:09:20", "remaining_time": "8:28:11", "throughput": 2510.94, "total_tokens": 1408064} +{"current_steps": 2430, "total_steps": 134280, "loss": 0.7015, "lr": 9.04453380994936e-06, "epoch": 0.36193029490616624, "percentage": 1.81, "elapsed_time": "0:09:21", "remaining_time": "8:28:09", "throughput": 2510.95, "total_tokens": 1410944} +{"current_steps": 2435, "total_steps": 134280, "loss": 0.679, "lr": 9.06315162347334e-06, "epoch": 0.3626750074471254, "percentage": 1.81, "elapsed_time": "0:09:23", "remaining_time": "8:28:09", "throughput": 2510.87, "total_tokens": 1413856} +{"current_steps": 2440, "total_steps": 134280, "loss": 0.659, "lr": 9.08176943699732e-06, "epoch": 0.3634197199880846, "percentage": 1.82, "elapsed_time": "0:09:24", "remaining_time": "8:28:08", "throughput": 2510.98, "total_tokens": 1416864} +{"current_steps": 2445, "total_steps": 134280, "loss": 0.6984, "lr": 9.100387250521298e-06, "epoch": 0.3641644325290438, "percentage": 1.82, "elapsed_time": "0:09:25", "remaining_time": "8:28:06", "throughput": 2510.89, "total_tokens": 1419680} +{"current_steps": 2450, "total_steps": 134280, "loss": 0.6694, "lr": 9.119005064045278e-06, "epoch": 0.364909145070003, "percentage": 1.82, "elapsed_time": "0:09:26", "remaining_time": "8:28:07", "throughput": 2510.89, "total_tokens": 1422656} +{"current_steps": 2455, "total_steps": 134280, "loss": 0.6768, "lr": 9.137622877569258e-06, "epoch": 0.3656538576109622, "percentage": 1.83, "elapsed_time": "0:09:27", "remaining_time": "8:28:05", "throughput": 2510.84, "total_tokens": 1425504} +{"current_steps": 2460, "total_steps": 134280, "loss": 0.9282, "lr": 9.156240691093238e-06, "epoch": 0.36639857015192134, "percentage": 1.83, "elapsed_time": "0:09:28", "remaining_time": "8:28:09", "throughput": 2510.91, "total_tokens": 1428704} +{"current_steps": 2465, "total_steps": 134280, "loss": 0.858, "lr": 9.174858504617218e-06, "epoch": 0.36714328269288055, "percentage": 1.84, "elapsed_time": "0:09:30", "remaining_time": "8:28:10", "throughput": 2511.0, "total_tokens": 1431744} +{"current_steps": 2470, "total_steps": 134280, "loss": 0.7574, "lr": 9.193476318141198e-06, "epoch": 0.36788799523383975, "percentage": 1.84, "elapsed_time": "0:09:31", "remaining_time": "8:28:13", "throughput": 2511.1, "total_tokens": 1434880} +{"current_steps": 2475, "total_steps": 134280, "loss": 0.6614, "lr": 9.212094131665178e-06, "epoch": 0.36863270777479895, "percentage": 1.84, "elapsed_time": "0:09:32", "remaining_time": "8:28:11", "throughput": 2511.08, "total_tokens": 1437728} +{"current_steps": 2480, "total_steps": 134280, "loss": 0.6218, "lr": 9.230711945189158e-06, "epoch": 0.3693774203157581, "percentage": 1.85, "elapsed_time": "0:09:33", "remaining_time": "8:28:10", "throughput": 2511.14, "total_tokens": 1440672} +{"current_steps": 2485, "total_steps": 134280, "loss": 0.6598, "lr": 9.249329758713138e-06, "epoch": 0.3701221328567173, "percentage": 1.85, "elapsed_time": "0:09:34", "remaining_time": "8:28:06", "throughput": 2511.1, "total_tokens": 1443424} +{"current_steps": 2490, "total_steps": 134280, "loss": 0.7236, "lr": 9.267947572237116e-06, "epoch": 0.3708668453976765, "percentage": 1.85, "elapsed_time": "0:09:35", "remaining_time": "8:28:04", "throughput": 2511.17, "total_tokens": 1446368} +{"current_steps": 2495, "total_steps": 134280, "loss": 0.6217, "lr": 9.286565385761096e-06, "epoch": 0.3716115579386357, "percentage": 1.86, "elapsed_time": "0:09:37", "remaining_time": "8:28:03", "throughput": 2511.05, "total_tokens": 1449184} +{"current_steps": 2500, "total_steps": 134280, "loss": 0.6284, "lr": 9.305183199285077e-06, "epoch": 0.37235627047959485, "percentage": 1.86, "elapsed_time": "0:09:38", "remaining_time": "8:28:03", "throughput": 2510.94, "total_tokens": 1452096} +{"current_steps": 2505, "total_steps": 134280, "loss": 0.8327, "lr": 9.323801012809057e-06, "epoch": 0.37310098302055406, "percentage": 1.87, "elapsed_time": "0:09:39", "remaining_time": "8:28:03", "throughput": 2510.94, "total_tokens": 1455040} +{"current_steps": 2510, "total_steps": 134280, "loss": 0.6333, "lr": 9.342418826333036e-06, "epoch": 0.37384569556151326, "percentage": 1.87, "elapsed_time": "0:09:40", "remaining_time": "8:28:01", "throughput": 2511.04, "total_tokens": 1457984} +{"current_steps": 2515, "total_steps": 134280, "loss": 0.665, "lr": 9.361036639857016e-06, "epoch": 0.37459040810247246, "percentage": 1.87, "elapsed_time": "0:09:41", "remaining_time": "8:28:00", "throughput": 2511.07, "total_tokens": 1460896} +{"current_steps": 2520, "total_steps": 134280, "loss": 0.5086, "lr": 9.379654453380995e-06, "epoch": 0.3753351206434316, "percentage": 1.88, "elapsed_time": "0:09:42", "remaining_time": "8:27:57", "throughput": 2511.19, "total_tokens": 1463776} +{"current_steps": 2525, "total_steps": 134280, "loss": 0.7674, "lr": 9.398272266904975e-06, "epoch": 0.3760798331843908, "percentage": 1.88, "elapsed_time": "0:09:43", "remaining_time": "8:27:52", "throughput": 2511.14, "total_tokens": 1466464} +{"current_steps": 2530, "total_steps": 134280, "loss": 0.6392, "lr": 9.416890080428954e-06, "epoch": 0.37682454572535, "percentage": 1.88, "elapsed_time": "0:09:45", "remaining_time": "8:27:53", "throughput": 2511.14, "total_tokens": 1469472} +{"current_steps": 2535, "total_steps": 134280, "loss": 0.6424, "lr": 9.435507893952934e-06, "epoch": 0.3775692582663092, "percentage": 1.89, "elapsed_time": "0:09:46", "remaining_time": "8:27:50", "throughput": 2511.08, "total_tokens": 1472256} +{"current_steps": 2540, "total_steps": 134280, "loss": 0.6139, "lr": 9.454125707476915e-06, "epoch": 0.3783139708072684, "percentage": 1.89, "elapsed_time": "0:09:47", "remaining_time": "8:27:51", "throughput": 2511.27, "total_tokens": 1475392} +{"current_steps": 2545, "total_steps": 134280, "loss": 0.6513, "lr": 9.472743521000895e-06, "epoch": 0.37905868334822757, "percentage": 1.9, "elapsed_time": "0:09:48", "remaining_time": "8:27:44", "throughput": 2510.99, "total_tokens": 1477856} +{"current_steps": 2550, "total_steps": 134280, "loss": 0.7555, "lr": 9.491361334524875e-06, "epoch": 0.37980339588918677, "percentage": 1.9, "elapsed_time": "0:09:49", "remaining_time": "8:27:43", "throughput": 2510.94, "total_tokens": 1480736} +{"current_steps": 2555, "total_steps": 134280, "loss": 0.7699, "lr": 9.509979148048853e-06, "epoch": 0.38054810843014597, "percentage": 1.9, "elapsed_time": "0:09:50", "remaining_time": "8:27:43", "throughput": 2510.96, "total_tokens": 1483680} +{"current_steps": 2560, "total_steps": 134280, "loss": 0.7395, "lr": 9.528596961572833e-06, "epoch": 0.3812928209711052, "percentage": 1.91, "elapsed_time": "0:09:52", "remaining_time": "8:27:41", "throughput": 2510.97, "total_tokens": 1486560} +{"current_steps": 2565, "total_steps": 134280, "loss": 0.7138, "lr": 9.547214775096813e-06, "epoch": 0.3820375335120643, "percentage": 1.91, "elapsed_time": "0:09:53", "remaining_time": "8:27:39", "throughput": 2510.92, "total_tokens": 1489376} +{"current_steps": 2570, "total_steps": 134280, "loss": 0.6484, "lr": 9.565832588620793e-06, "epoch": 0.3827822460530235, "percentage": 1.91, "elapsed_time": "0:09:54", "remaining_time": "8:27:38", "throughput": 2511.13, "total_tokens": 1492448} +{"current_steps": 2575, "total_steps": 134280, "loss": 0.6859, "lr": 9.584450402144771e-06, "epoch": 0.3835269585939827, "percentage": 1.92, "elapsed_time": "0:09:55", "remaining_time": "8:27:39", "throughput": 2511.13, "total_tokens": 1495424} +{"current_steps": 2580, "total_steps": 134280, "loss": 0.7025, "lr": 9.603068215668753e-06, "epoch": 0.38427167113494193, "percentage": 1.92, "elapsed_time": "0:09:56", "remaining_time": "8:27:38", "throughput": 2511.2, "total_tokens": 1498368} +{"current_steps": 2585, "total_steps": 134280, "loss": 0.6367, "lr": 9.621686029192733e-06, "epoch": 0.3850163836759011, "percentage": 1.93, "elapsed_time": "0:09:57", "remaining_time": "8:27:35", "throughput": 2511.11, "total_tokens": 1501152} +{"current_steps": 2590, "total_steps": 134280, "loss": 0.7616, "lr": 9.640303842716713e-06, "epoch": 0.3857610962168603, "percentage": 1.93, "elapsed_time": "0:09:58", "remaining_time": "8:27:34", "throughput": 2511.14, "total_tokens": 1504096} +{"current_steps": 2595, "total_steps": 134280, "loss": 0.7824, "lr": 9.658921656240691e-06, "epoch": 0.3865058087578195, "percentage": 1.93, "elapsed_time": "0:10:00", "remaining_time": "8:27:34", "throughput": 2511.27, "total_tokens": 1507136} +{"current_steps": 2600, "total_steps": 134280, "loss": 0.6308, "lr": 9.677539469764671e-06, "epoch": 0.3872505212987787, "percentage": 1.94, "elapsed_time": "0:10:01", "remaining_time": "8:27:31", "throughput": 2511.24, "total_tokens": 1509888} +{"current_steps": 2605, "total_steps": 134280, "loss": 0.7132, "lr": 9.69615728328865e-06, "epoch": 0.3879952338397379, "percentage": 1.94, "elapsed_time": "0:10:02", "remaining_time": "8:27:32", "throughput": 2511.32, "total_tokens": 1512960} +{"current_steps": 2610, "total_steps": 134280, "loss": 0.7371, "lr": 9.71477509681263e-06, "epoch": 0.38873994638069703, "percentage": 1.94, "elapsed_time": "0:10:03", "remaining_time": "8:27:27", "throughput": 2511.27, "total_tokens": 1515648} +{"current_steps": 2615, "total_steps": 134280, "loss": 0.6536, "lr": 9.73339291033661e-06, "epoch": 0.38948465892165623, "percentage": 1.95, "elapsed_time": "0:10:04", "remaining_time": "8:27:24", "throughput": 2511.2, "total_tokens": 1518432} +{"current_steps": 2620, "total_steps": 134280, "loss": 0.7652, "lr": 9.75201072386059e-06, "epoch": 0.39022937146261544, "percentage": 1.95, "elapsed_time": "0:10:05", "remaining_time": "8:27:20", "throughput": 2511.13, "total_tokens": 1521152} +{"current_steps": 2625, "total_steps": 134280, "loss": 0.7137, "lr": 9.77062853738457e-06, "epoch": 0.39097408400357464, "percentage": 1.95, "elapsed_time": "0:10:06", "remaining_time": "8:27:14", "throughput": 2511.03, "total_tokens": 1523744} +{"current_steps": 2630, "total_steps": 134280, "loss": 0.665, "lr": 9.78924635090855e-06, "epoch": 0.3917187965445338, "percentage": 1.96, "elapsed_time": "0:10:08", "remaining_time": "8:27:15", "throughput": 2510.99, "total_tokens": 1526720} +{"current_steps": 2635, "total_steps": 134280, "loss": 0.5688, "lr": 9.80786416443253e-06, "epoch": 0.392463509085493, "percentage": 1.96, "elapsed_time": "0:10:09", "remaining_time": "8:27:17", "throughput": 2511.0, "total_tokens": 1529792} +{"current_steps": 2640, "total_steps": 134280, "loss": 0.712, "lr": 9.826481977956509e-06, "epoch": 0.3932082216264522, "percentage": 1.97, "elapsed_time": "0:10:10", "remaining_time": "8:27:14", "throughput": 2510.91, "total_tokens": 1532544} +{"current_steps": 2645, "total_steps": 134280, "loss": 0.7112, "lr": 9.845099791480489e-06, "epoch": 0.3939529341674114, "percentage": 1.97, "elapsed_time": "0:10:11", "remaining_time": "8:27:15", "throughput": 2510.99, "total_tokens": 1535616} +{"current_steps": 2650, "total_steps": 134280, "loss": 0.7286, "lr": 9.863717605004468e-06, "epoch": 0.39469764670837054, "percentage": 1.97, "elapsed_time": "0:10:12", "remaining_time": "8:27:20", "throughput": 2511.27, "total_tokens": 1539008} +{"current_steps": 2655, "total_steps": 134280, "loss": 0.6745, "lr": 9.882335418528448e-06, "epoch": 0.39544235924932974, "percentage": 1.98, "elapsed_time": "0:10:13", "remaining_time": "8:27:18", "throughput": 2511.19, "total_tokens": 1541792} +{"current_steps": 2660, "total_steps": 134280, "loss": 0.6615, "lr": 9.900953232052428e-06, "epoch": 0.39618707179028895, "percentage": 1.98, "elapsed_time": "0:10:15", "remaining_time": "8:27:20", "throughput": 2511.18, "total_tokens": 1544864} +{"current_steps": 2665, "total_steps": 134280, "loss": 0.6747, "lr": 9.919571045576408e-06, "epoch": 0.39693178433124815, "percentage": 1.98, "elapsed_time": "0:10:16", "remaining_time": "8:27:22", "throughput": 2511.15, "total_tokens": 1547904} +{"current_steps": 2670, "total_steps": 134280, "loss": 0.6305, "lr": 9.938188859100388e-06, "epoch": 0.39767649687220735, "percentage": 1.99, "elapsed_time": "0:10:17", "remaining_time": "8:27:19", "throughput": 2511.09, "total_tokens": 1550688} +{"current_steps": 2675, "total_steps": 134280, "loss": 0.6713, "lr": 9.956806672624368e-06, "epoch": 0.3984212094131665, "percentage": 1.99, "elapsed_time": "0:10:18", "remaining_time": "8:27:23", "throughput": 2511.09, "total_tokens": 1553824} +{"current_steps": 2680, "total_steps": 134280, "loss": 0.5161, "lr": 9.975424486148348e-06, "epoch": 0.3991659219541257, "percentage": 2.0, "elapsed_time": "0:10:19", "remaining_time": "8:27:19", "throughput": 2511.06, "total_tokens": 1556576} +{"current_steps": 2685, "total_steps": 134280, "loss": 0.6303, "lr": 9.994042299672326e-06, "epoch": 0.3999106344950849, "percentage": 2.0, "elapsed_time": "0:10:20", "remaining_time": "8:27:15", "throughput": 2510.99, "total_tokens": 1559296} +{"current_steps": 2690, "total_steps": 134280, "loss": 0.6971, "lr": 1.0012660113196306e-05, "epoch": 0.4006553470360441, "percentage": 2.0, "elapsed_time": "0:10:22", "remaining_time": "8:27:15", "throughput": 2510.99, "total_tokens": 1562240} +{"current_steps": 2695, "total_steps": 134280, "loss": 0.5904, "lr": 1.0031277926720286e-05, "epoch": 0.40140005957700325, "percentage": 2.01, "elapsed_time": "0:10:23", "remaining_time": "8:27:13", "throughput": 2510.94, "total_tokens": 1565088} +{"current_steps": 2700, "total_steps": 134280, "loss": 0.656, "lr": 1.0049895740244266e-05, "epoch": 0.40214477211796246, "percentage": 2.01, "elapsed_time": "0:10:24", "remaining_time": "8:27:13", "throughput": 2510.85, "total_tokens": 1568000} +{"current_steps": 2705, "total_steps": 134280, "loss": 0.7777, "lr": 1.0068513553768246e-05, "epoch": 0.40288948465892166, "percentage": 2.01, "elapsed_time": "0:10:25", "remaining_time": "8:27:11", "throughput": 2510.94, "total_tokens": 1570912} +{"current_steps": 2710, "total_steps": 134280, "loss": 0.7816, "lr": 1.0087131367292226e-05, "epoch": 0.40363419719988086, "percentage": 2.02, "elapsed_time": "0:10:26", "remaining_time": "8:27:10", "throughput": 2510.99, "total_tokens": 1573888} +{"current_steps": 2715, "total_steps": 134280, "loss": 0.7147, "lr": 1.0105749180816206e-05, "epoch": 0.40437890974084, "percentage": 2.02, "elapsed_time": "0:10:27", "remaining_time": "8:27:08", "throughput": 2510.89, "total_tokens": 1576672} +{"current_steps": 2720, "total_steps": 134280, "loss": 0.5474, "lr": 1.0124366994340186e-05, "epoch": 0.4051236222817992, "percentage": 2.03, "elapsed_time": "0:10:29", "remaining_time": "8:27:05", "throughput": 2510.83, "total_tokens": 1579456} +{"current_steps": 2725, "total_steps": 134280, "loss": 0.7251, "lr": 1.0142984807864164e-05, "epoch": 0.4058683348227584, "percentage": 2.03, "elapsed_time": "0:10:30", "remaining_time": "8:27:00", "throughput": 2510.57, "total_tokens": 1581952} +{"current_steps": 2730, "total_steps": 134280, "loss": 0.657, "lr": 1.0161602621388144e-05, "epoch": 0.4066130473637176, "percentage": 2.03, "elapsed_time": "0:10:31", "remaining_time": "8:26:59", "throughput": 2510.57, "total_tokens": 1584864} +{"current_steps": 2735, "total_steps": 134280, "loss": 0.7365, "lr": 1.0180220434912124e-05, "epoch": 0.4073577599046768, "percentage": 2.04, "elapsed_time": "0:10:32", "remaining_time": "8:27:02", "throughput": 2510.83, "total_tokens": 1588160} +{"current_steps": 2740, "total_steps": 134280, "loss": 0.7556, "lr": 1.0198838248436104e-05, "epoch": 0.40810247244563597, "percentage": 2.04, "elapsed_time": "0:10:33", "remaining_time": "8:26:58", "throughput": 2510.77, "total_tokens": 1590880} +{"current_steps": 2745, "total_steps": 134280, "loss": 0.7406, "lr": 1.0217456061960085e-05, "epoch": 0.40884718498659517, "percentage": 2.04, "elapsed_time": "0:10:34", "remaining_time": "8:26:54", "throughput": 2510.71, "total_tokens": 1593600} +{"current_steps": 2750, "total_steps": 134280, "loss": 0.8826, "lr": 1.0236073875484064e-05, "epoch": 0.40959189752755437, "percentage": 2.05, "elapsed_time": "0:10:35", "remaining_time": "8:26:53", "throughput": 2510.7, "total_tokens": 1596512} +{"current_steps": 2755, "total_steps": 134280, "loss": 0.6347, "lr": 1.0254691689008044e-05, "epoch": 0.4103366100685136, "percentage": 2.05, "elapsed_time": "0:10:37", "remaining_time": "8:26:50", "throughput": 2510.65, "total_tokens": 1599296} +{"current_steps": 2760, "total_steps": 134280, "loss": 0.6868, "lr": 1.0273309502532023e-05, "epoch": 0.4110813226094727, "percentage": 2.06, "elapsed_time": "0:10:38", "remaining_time": "8:26:49", "throughput": 2510.72, "total_tokens": 1602208} +{"current_steps": 2765, "total_steps": 134280, "loss": 0.7353, "lr": 1.0291927316056003e-05, "epoch": 0.4118260351504319, "percentage": 2.06, "elapsed_time": "0:10:39", "remaining_time": "8:26:49", "throughput": 2510.72, "total_tokens": 1605184} +{"current_steps": 2770, "total_steps": 134280, "loss": 0.6722, "lr": 1.0310545129579982e-05, "epoch": 0.4125707476913911, "percentage": 2.06, "elapsed_time": "0:10:40", "remaining_time": "8:26:47", "throughput": 2510.73, "total_tokens": 1608032} +{"current_steps": 2775, "total_steps": 134280, "loss": 0.7214, "lr": 1.0329162943103962e-05, "epoch": 0.41331546023235033, "percentage": 2.07, "elapsed_time": "0:10:41", "remaining_time": "8:26:48", "throughput": 2510.8, "total_tokens": 1611104} +{"current_steps": 2780, "total_steps": 134280, "loss": 0.7364, "lr": 1.0347780756627941e-05, "epoch": 0.4140601727733095, "percentage": 2.07, "elapsed_time": "0:10:42", "remaining_time": "8:26:47", "throughput": 2510.8, "total_tokens": 1614048} +{"current_steps": 2785, "total_steps": 134280, "loss": 0.8323, "lr": 1.0366398570151923e-05, "epoch": 0.4148048853142687, "percentage": 2.07, "elapsed_time": "0:10:44", "remaining_time": "8:26:48", "throughput": 2510.81, "total_tokens": 1617056} +{"current_steps": 2790, "total_steps": 134280, "loss": 0.7618, "lr": 1.0385016383675901e-05, "epoch": 0.4155495978552279, "percentage": 2.08, "elapsed_time": "0:10:45", "remaining_time": "8:26:44", "throughput": 2510.61, "total_tokens": 1619680} +{"current_steps": 2795, "total_steps": 134280, "loss": 0.683, "lr": 1.0403634197199881e-05, "epoch": 0.4162943103961871, "percentage": 2.08, "elapsed_time": "0:10:46", "remaining_time": "8:26:46", "throughput": 2510.68, "total_tokens": 1622816} +{"current_steps": 2800, "total_steps": 134280, "loss": 0.7641, "lr": 1.0422252010723861e-05, "epoch": 0.4170390229371463, "percentage": 2.09, "elapsed_time": "0:10:47", "remaining_time": "8:26:45", "throughput": 2510.65, "total_tokens": 1625664} +{"current_steps": 2805, "total_steps": 134280, "loss": 0.7152, "lr": 1.0440869824247841e-05, "epoch": 0.41778373547810543, "percentage": 2.09, "elapsed_time": "0:10:48", "remaining_time": "8:26:42", "throughput": 2510.51, "total_tokens": 1628384} +{"current_steps": 2810, "total_steps": 134280, "loss": 0.6084, "lr": 1.0459487637771821e-05, "epoch": 0.41852844801906464, "percentage": 2.09, "elapsed_time": "0:10:49", "remaining_time": "8:26:45", "throughput": 2510.67, "total_tokens": 1631616} +{"current_steps": 2815, "total_steps": 134280, "loss": 0.6904, "lr": 1.04781054512958e-05, "epoch": 0.41927316056002384, "percentage": 2.1, "elapsed_time": "0:10:50", "remaining_time": "8:26:41", "throughput": 2510.55, "total_tokens": 1634304} +{"current_steps": 2820, "total_steps": 134280, "loss": 0.6478, "lr": 1.049672326481978e-05, "epoch": 0.42001787310098304, "percentage": 2.1, "elapsed_time": "0:10:52", "remaining_time": "8:26:41", "throughput": 2510.65, "total_tokens": 1637312} +{"current_steps": 2825, "total_steps": 134280, "loss": 0.7495, "lr": 1.051534107834376e-05, "epoch": 0.4207625856419422, "percentage": 2.1, "elapsed_time": "0:10:53", "remaining_time": "8:26:40", "throughput": 2510.59, "total_tokens": 1640192} +{"current_steps": 2830, "total_steps": 134280, "loss": 0.7379, "lr": 1.053395889186774e-05, "epoch": 0.4215072981829014, "percentage": 2.11, "elapsed_time": "0:10:54", "remaining_time": "8:26:37", "throughput": 2510.56, "total_tokens": 1643008} +{"current_steps": 2835, "total_steps": 134280, "loss": 0.8693, "lr": 1.0552576705391719e-05, "epoch": 0.4222520107238606, "percentage": 2.11, "elapsed_time": "0:10:55", "remaining_time": "8:26:33", "throughput": 2510.51, "total_tokens": 1645696} +{"current_steps": 2840, "total_steps": 134280, "loss": 0.7489, "lr": 1.0571194518915699e-05, "epoch": 0.4229967232648198, "percentage": 2.11, "elapsed_time": "0:10:56", "remaining_time": "8:26:30", "throughput": 2510.4, "total_tokens": 1648448} +{"current_steps": 2845, "total_steps": 134280, "loss": 0.7749, "lr": 1.0589812332439679e-05, "epoch": 0.42374143580577894, "percentage": 2.12, "elapsed_time": "0:10:57", "remaining_time": "8:26:30", "throughput": 2510.43, "total_tokens": 1651392} +{"current_steps": 2850, "total_steps": 134280, "loss": 0.7086, "lr": 1.0608430145963659e-05, "epoch": 0.42448614834673815, "percentage": 2.12, "elapsed_time": "0:10:58", "remaining_time": "8:26:28", "throughput": 2510.35, "total_tokens": 1654240} +{"current_steps": 2855, "total_steps": 134280, "loss": 0.6217, "lr": 1.0627047959487637e-05, "epoch": 0.42523086088769735, "percentage": 2.13, "elapsed_time": "0:11:00", "remaining_time": "8:26:27", "throughput": 2510.27, "total_tokens": 1657088} +{"current_steps": 2860, "total_steps": 134280, "loss": 0.7277, "lr": 1.0645665773011617e-05, "epoch": 0.42597557342865655, "percentage": 2.13, "elapsed_time": "0:11:01", "remaining_time": "8:26:24", "throughput": 2510.1, "total_tokens": 1659744} +{"current_steps": 2865, "total_steps": 134280, "loss": 0.6812, "lr": 1.0664283586535598e-05, "epoch": 0.42672028596961575, "percentage": 2.13, "elapsed_time": "0:11:02", "remaining_time": "8:26:24", "throughput": 2509.96, "total_tokens": 1662656} +{"current_steps": 2870, "total_steps": 134280, "loss": 0.6383, "lr": 1.0682901400059578e-05, "epoch": 0.4274649985105749, "percentage": 2.14, "elapsed_time": "0:11:03", "remaining_time": "8:26:21", "throughput": 2509.87, "total_tokens": 1665408} +{"current_steps": 2875, "total_steps": 134280, "loss": 0.5172, "lr": 1.0701519213583558e-05, "epoch": 0.4282097110515341, "percentage": 2.14, "elapsed_time": "0:11:04", "remaining_time": "8:26:19", "throughput": 2509.77, "total_tokens": 1668160} +{"current_steps": 2880, "total_steps": 134280, "loss": 0.7279, "lr": 1.0720137027107537e-05, "epoch": 0.4289544235924933, "percentage": 2.14, "elapsed_time": "0:11:05", "remaining_time": "8:26:20", "throughput": 2509.84, "total_tokens": 1671232} +{"current_steps": 2885, "total_steps": 134280, "loss": 0.6307, "lr": 1.0738754840631517e-05, "epoch": 0.4296991361334525, "percentage": 2.15, "elapsed_time": "0:11:07", "remaining_time": "8:26:21", "throughput": 2509.94, "total_tokens": 1674336} +{"current_steps": 2890, "total_steps": 134280, "loss": 0.7972, "lr": 1.0757372654155496e-05, "epoch": 0.43044384867441166, "percentage": 2.15, "elapsed_time": "0:11:08", "remaining_time": "8:26:20", "throughput": 2509.89, "total_tokens": 1677184} +{"current_steps": 2895, "total_steps": 134280, "loss": 0.8635, "lr": 1.0775990467679476e-05, "epoch": 0.43118856121537086, "percentage": 2.16, "elapsed_time": "0:11:09", "remaining_time": "8:26:16", "throughput": 2509.79, "total_tokens": 1679904} +{"current_steps": 2900, "total_steps": 134280, "loss": 0.633, "lr": 1.0794608281203456e-05, "epoch": 0.43193327375633006, "percentage": 2.16, "elapsed_time": "0:11:10", "remaining_time": "8:26:13", "throughput": 2509.75, "total_tokens": 1682656} +{"current_steps": 2905, "total_steps": 134280, "loss": 0.6222, "lr": 1.0813226094727436e-05, "epoch": 0.43267798629728926, "percentage": 2.16, "elapsed_time": "0:11:11", "remaining_time": "8:26:10", "throughput": 2509.73, "total_tokens": 1685440} +{"current_steps": 2910, "total_steps": 134280, "loss": 0.7166, "lr": 1.0831843908251416e-05, "epoch": 0.4334226988382484, "percentage": 2.17, "elapsed_time": "0:11:12", "remaining_time": "8:26:07", "throughput": 2509.8, "total_tokens": 1688288} +{"current_steps": 2915, "total_steps": 134280, "loss": 0.5439, "lr": 1.0850461721775396e-05, "epoch": 0.4341674113792076, "percentage": 2.17, "elapsed_time": "0:11:13", "remaining_time": "8:26:07", "throughput": 2509.86, "total_tokens": 1691264} +{"current_steps": 2920, "total_steps": 134280, "loss": 0.7129, "lr": 1.0869079535299374e-05, "epoch": 0.4349121239201668, "percentage": 2.17, "elapsed_time": "0:11:15", "remaining_time": "8:26:06", "throughput": 2509.89, "total_tokens": 1694240} +{"current_steps": 2925, "total_steps": 134280, "loss": 0.7334, "lr": 1.0887697348823354e-05, "epoch": 0.435656836461126, "percentage": 2.18, "elapsed_time": "0:11:16", "remaining_time": "8:26:06", "throughput": 2509.84, "total_tokens": 1697152} +{"current_steps": 2930, "total_steps": 134280, "loss": 0.6296, "lr": 1.0906315162347334e-05, "epoch": 0.4364015490020852, "percentage": 2.18, "elapsed_time": "0:11:17", "remaining_time": "8:26:03", "throughput": 2509.81, "total_tokens": 1699936} +{"current_steps": 2935, "total_steps": 134280, "loss": 0.6725, "lr": 1.0924932975871314e-05, "epoch": 0.43714626154304437, "percentage": 2.19, "elapsed_time": "0:11:18", "remaining_time": "8:26:02", "throughput": 2509.84, "total_tokens": 1702880} +{"current_steps": 2940, "total_steps": 134280, "loss": 0.6637, "lr": 1.0943550789395294e-05, "epoch": 0.43789097408400357, "percentage": 2.19, "elapsed_time": "0:11:19", "remaining_time": "8:26:00", "throughput": 2509.77, "total_tokens": 1705664} +{"current_steps": 2945, "total_steps": 134280, "loss": 0.6478, "lr": 1.0962168602919274e-05, "epoch": 0.4386356866249628, "percentage": 2.19, "elapsed_time": "0:11:20", "remaining_time": "8:25:57", "throughput": 2509.74, "total_tokens": 1708416} +{"current_steps": 2950, "total_steps": 134280, "loss": 0.5258, "lr": 1.0980786416443254e-05, "epoch": 0.439380399165922, "percentage": 2.2, "elapsed_time": "0:11:21", "remaining_time": "8:25:56", "throughput": 2509.84, "total_tokens": 1711424} +{"current_steps": 2955, "total_steps": 134280, "loss": 0.9414, "lr": 1.0999404229967234e-05, "epoch": 0.4401251117068811, "percentage": 2.2, "elapsed_time": "0:11:22", "remaining_time": "8:25:53", "throughput": 2509.85, "total_tokens": 1714208} +{"current_steps": 2960, "total_steps": 134280, "loss": 0.6444, "lr": 1.1018022043491214e-05, "epoch": 0.4408698242478403, "percentage": 2.2, "elapsed_time": "0:11:24", "remaining_time": "8:25:50", "throughput": 2509.8, "total_tokens": 1716992} +{"current_steps": 2965, "total_steps": 134280, "loss": 0.9815, "lr": 1.1036639857015192e-05, "epoch": 0.4416145367887995, "percentage": 2.21, "elapsed_time": "0:11:25", "remaining_time": "8:25:48", "throughput": 2509.77, "total_tokens": 1719840} +{"current_steps": 2970, "total_steps": 134280, "loss": 0.6757, "lr": 1.1055257670539172e-05, "epoch": 0.44235924932975873, "percentage": 2.21, "elapsed_time": "0:11:26", "remaining_time": "8:25:44", "throughput": 2509.61, "total_tokens": 1722464} +{"current_steps": 2975, "total_steps": 134280, "loss": 0.6321, "lr": 1.1073875484063152e-05, "epoch": 0.4431039618707179, "percentage": 2.22, "elapsed_time": "0:11:27", "remaining_time": "8:25:41", "throughput": 2509.59, "total_tokens": 1725216} +{"current_steps": 2980, "total_steps": 134280, "loss": 0.7762, "lr": 1.1092493297587132e-05, "epoch": 0.4438486744116771, "percentage": 2.22, "elapsed_time": "0:11:28", "remaining_time": "8:25:38", "throughput": 2509.54, "total_tokens": 1728000} +{"current_steps": 2985, "total_steps": 134280, "loss": 0.6389, "lr": 1.1111111111111112e-05, "epoch": 0.4445933869526363, "percentage": 2.22, "elapsed_time": "0:11:29", "remaining_time": "8:25:38", "throughput": 2509.47, "total_tokens": 1730912} +{"current_steps": 2990, "total_steps": 134280, "loss": 0.6689, "lr": 1.1129728924635092e-05, "epoch": 0.4453380994935955, "percentage": 2.23, "elapsed_time": "0:11:30", "remaining_time": "8:25:34", "throughput": 2509.39, "total_tokens": 1733600} +{"current_steps": 2995, "total_steps": 134280, "loss": 0.5399, "lr": 1.1148346738159071e-05, "epoch": 0.4460828120345547, "percentage": 2.23, "elapsed_time": "0:11:31", "remaining_time": "8:25:33", "throughput": 2509.38, "total_tokens": 1736480} +{"current_steps": 3000, "total_steps": 134280, "loss": 0.5669, "lr": 1.1166964551683051e-05, "epoch": 0.44682752457551383, "percentage": 2.23, "elapsed_time": "0:11:33", "remaining_time": "8:25:31", "throughput": 2509.28, "total_tokens": 1739264} +{"current_steps": 3005, "total_steps": 134280, "loss": 0.6507, "lr": 1.1185582365207031e-05, "epoch": 0.44757223711647304, "percentage": 2.24, "elapsed_time": "0:11:34", "remaining_time": "8:25:32", "throughput": 2509.35, "total_tokens": 1742336} +{"current_steps": 3010, "total_steps": 134280, "loss": 0.6872, "lr": 1.120420017873101e-05, "epoch": 0.44831694965743224, "percentage": 2.24, "elapsed_time": "0:11:35", "remaining_time": "8:25:30", "throughput": 2509.38, "total_tokens": 1745216} +{"current_steps": 3015, "total_steps": 134280, "loss": 0.781, "lr": 1.122281799225499e-05, "epoch": 0.44906166219839144, "percentage": 2.25, "elapsed_time": "0:11:36", "remaining_time": "8:25:30", "throughput": 2509.44, "total_tokens": 1748192} +{"current_steps": 3020, "total_steps": 134280, "loss": 0.9747, "lr": 1.124143580577897e-05, "epoch": 0.4498063747393506, "percentage": 2.25, "elapsed_time": "0:11:37", "remaining_time": "8:25:27", "throughput": 2509.39, "total_tokens": 1750944} +{"current_steps": 3025, "total_steps": 134280, "loss": 0.6629, "lr": 1.126005361930295e-05, "epoch": 0.4505510872803098, "percentage": 2.25, "elapsed_time": "0:11:38", "remaining_time": "8:25:26", "throughput": 2509.39, "total_tokens": 1753856} +{"current_steps": 3030, "total_steps": 134280, "loss": 0.6627, "lr": 1.127867143282693e-05, "epoch": 0.451295799821269, "percentage": 2.26, "elapsed_time": "0:11:40", "remaining_time": "8:25:26", "throughput": 2509.46, "total_tokens": 1756896} +{"current_steps": 3035, "total_steps": 134280, "loss": 0.7388, "lr": 1.129728924635091e-05, "epoch": 0.4520405123622282, "percentage": 2.26, "elapsed_time": "0:11:41", "remaining_time": "8:25:27", "throughput": 2509.62, "total_tokens": 1760032} +{"current_steps": 3040, "total_steps": 134280, "loss": 0.6431, "lr": 1.1315907059874889e-05, "epoch": 0.45278522490318734, "percentage": 2.26, "elapsed_time": "0:11:42", "remaining_time": "8:25:25", "throughput": 2509.61, "total_tokens": 1762848} +{"current_steps": 3045, "total_steps": 134280, "loss": 0.7241, "lr": 1.1334524873398869e-05, "epoch": 0.45352993744414655, "percentage": 2.27, "elapsed_time": "0:11:43", "remaining_time": "8:25:24", "throughput": 2509.6, "total_tokens": 1765760} +{"current_steps": 3050, "total_steps": 134280, "loss": 0.592, "lr": 1.1353142686922847e-05, "epoch": 0.45427464998510575, "percentage": 2.27, "elapsed_time": "0:11:44", "remaining_time": "8:25:22", "throughput": 2509.58, "total_tokens": 1768608} +{"current_steps": 3055, "total_steps": 134280, "loss": 0.729, "lr": 1.1371760500446827e-05, "epoch": 0.45501936252606495, "percentage": 2.28, "elapsed_time": "0:11:45", "remaining_time": "8:25:24", "throughput": 2509.73, "total_tokens": 1771808} +{"current_steps": 3060, "total_steps": 134280, "loss": 0.6005, "lr": 1.1390378313970807e-05, "epoch": 0.45576407506702415, "percentage": 2.28, "elapsed_time": "0:11:47", "remaining_time": "8:25:22", "throughput": 2509.75, "total_tokens": 1774656} +{"current_steps": 3065, "total_steps": 134280, "loss": 0.7877, "lr": 1.1408996127494787e-05, "epoch": 0.4565087876079833, "percentage": 2.28, "elapsed_time": "0:11:48", "remaining_time": "8:25:20", "throughput": 2509.8, "total_tokens": 1777568} +{"current_steps": 3070, "total_steps": 134280, "loss": 0.7914, "lr": 1.1427613941018769e-05, "epoch": 0.4572535001489425, "percentage": 2.29, "elapsed_time": "0:11:49", "remaining_time": "8:25:22", "throughput": 2509.81, "total_tokens": 1780672} +{"current_steps": 3075, "total_steps": 134280, "loss": 0.6163, "lr": 1.1446231754542747e-05, "epoch": 0.4579982126899017, "percentage": 2.29, "elapsed_time": "0:11:50", "remaining_time": "8:25:19", "throughput": 2509.79, "total_tokens": 1783424} +{"current_steps": 3080, "total_steps": 134280, "loss": 0.6992, "lr": 1.1464849568066727e-05, "epoch": 0.4587429252308609, "percentage": 2.29, "elapsed_time": "0:11:51", "remaining_time": "8:25:16", "throughput": 2509.77, "total_tokens": 1786176} +{"current_steps": 3085, "total_steps": 134280, "loss": 0.8996, "lr": 1.1483467381590707e-05, "epoch": 0.45948763777182006, "percentage": 2.3, "elapsed_time": "0:11:52", "remaining_time": "8:25:13", "throughput": 2509.68, "total_tokens": 1788896} +{"current_steps": 3090, "total_steps": 134280, "loss": 0.8595, "lr": 1.1502085195114687e-05, "epoch": 0.46023235031277926, "percentage": 2.3, "elapsed_time": "0:11:53", "remaining_time": "8:25:12", "throughput": 2509.71, "total_tokens": 1791840} +{"current_steps": 3095, "total_steps": 134280, "loss": 0.5474, "lr": 1.1520703008638665e-05, "epoch": 0.46097706285373846, "percentage": 2.3, "elapsed_time": "0:11:55", "remaining_time": "8:25:10", "throughput": 2509.79, "total_tokens": 1794752} +{"current_steps": 3100, "total_steps": 134280, "loss": 0.6348, "lr": 1.1539320822162645e-05, "epoch": 0.46172177539469766, "percentage": 2.31, "elapsed_time": "0:11:56", "remaining_time": "8:25:07", "throughput": 2509.77, "total_tokens": 1797568} +{"current_steps": 3105, "total_steps": 134280, "loss": 0.84, "lr": 1.1557938635686626e-05, "epoch": 0.4624664879356568, "percentage": 2.31, "elapsed_time": "0:11:57", "remaining_time": "8:25:10", "throughput": 2509.91, "total_tokens": 1800768} +{"current_steps": 3110, "total_steps": 134280, "loss": 0.7101, "lr": 1.1576556449210606e-05, "epoch": 0.463211200476616, "percentage": 2.32, "elapsed_time": "0:11:58", "remaining_time": "8:25:09", "throughput": 2509.97, "total_tokens": 1803744} +{"current_steps": 3115, "total_steps": 134280, "loss": 0.6717, "lr": 1.1595174262734585e-05, "epoch": 0.4639559130175752, "percentage": 2.32, "elapsed_time": "0:11:59", "remaining_time": "8:25:08", "throughput": 2509.94, "total_tokens": 1806624} +{"current_steps": 3120, "total_steps": 134280, "loss": 0.828, "lr": 1.1613792076258565e-05, "epoch": 0.4647006255585344, "percentage": 2.32, "elapsed_time": "0:12:00", "remaining_time": "8:25:07", "throughput": 2510.0, "total_tokens": 1809600} +{"current_steps": 3125, "total_steps": 134280, "loss": 0.6971, "lr": 1.1632409889782545e-05, "epoch": 0.4654453380994936, "percentage": 2.33, "elapsed_time": "0:12:02", "remaining_time": "8:25:06", "throughput": 2509.96, "total_tokens": 1812480} +{"current_steps": 3130, "total_steps": 134280, "loss": 0.6242, "lr": 1.1651027703306524e-05, "epoch": 0.46619005064045277, "percentage": 2.33, "elapsed_time": "0:12:03", "remaining_time": "8:25:04", "throughput": 2510.0, "total_tokens": 1815328} +{"current_steps": 3135, "total_steps": 134280, "loss": 0.7664, "lr": 1.1669645516830504e-05, "epoch": 0.46693476318141197, "percentage": 2.33, "elapsed_time": "0:12:04", "remaining_time": "8:25:05", "throughput": 2509.98, "total_tokens": 1818368} +{"current_steps": 3140, "total_steps": 134280, "loss": 0.6773, "lr": 1.1688263330354483e-05, "epoch": 0.4676794757223712, "percentage": 2.34, "elapsed_time": "0:12:05", "remaining_time": "8:25:05", "throughput": 2509.98, "total_tokens": 1821312} +{"current_steps": 3145, "total_steps": 134280, "loss": 0.7166, "lr": 1.1706881143878464e-05, "epoch": 0.4684241882633304, "percentage": 2.34, "elapsed_time": "0:12:06", "remaining_time": "8:25:09", "throughput": 2510.17, "total_tokens": 1824640} +{"current_steps": 3150, "total_steps": 134280, "loss": 0.6002, "lr": 1.1725498957402444e-05, "epoch": 0.4691689008042895, "percentage": 2.35, "elapsed_time": "0:12:08", "remaining_time": "8:25:06", "throughput": 2510.09, "total_tokens": 1827392} +{"current_steps": 3155, "total_steps": 134280, "loss": 0.7628, "lr": 1.1744116770926424e-05, "epoch": 0.4699136133452487, "percentage": 2.35, "elapsed_time": "0:12:09", "remaining_time": "8:25:02", "throughput": 2510.06, "total_tokens": 1830080} +{"current_steps": 3160, "total_steps": 134280, "loss": 0.7691, "lr": 1.1762734584450402e-05, "epoch": 0.47065832588620793, "percentage": 2.35, "elapsed_time": "0:12:10", "remaining_time": "8:25:01", "throughput": 2510.09, "total_tokens": 1833024} +{"current_steps": 3165, "total_steps": 134280, "loss": 0.7036, "lr": 1.1781352397974382e-05, "epoch": 0.47140303842716713, "percentage": 2.36, "elapsed_time": "0:12:11", "remaining_time": "8:24:57", "throughput": 2509.97, "total_tokens": 1835680} +{"current_steps": 3170, "total_steps": 134280, "loss": 0.6602, "lr": 1.1799970211498362e-05, "epoch": 0.4721477509681263, "percentage": 2.36, "elapsed_time": "0:12:12", "remaining_time": "8:24:55", "throughput": 2509.9, "total_tokens": 1838464} +{"current_steps": 3175, "total_steps": 134280, "loss": 0.6873, "lr": 1.1818588025022342e-05, "epoch": 0.4728924635090855, "percentage": 2.36, "elapsed_time": "0:12:13", "remaining_time": "8:24:58", "throughput": 2510.04, "total_tokens": 1841728} +{"current_steps": 3180, "total_steps": 134280, "loss": 0.694, "lr": 1.183720583854632e-05, "epoch": 0.4736371760500447, "percentage": 2.37, "elapsed_time": "0:12:14", "remaining_time": "8:24:56", "throughput": 2510.03, "total_tokens": 1844576} +{"current_steps": 3185, "total_steps": 134280, "loss": 0.725, "lr": 1.1855823652070302e-05, "epoch": 0.4743818885910039, "percentage": 2.37, "elapsed_time": "0:12:16", "remaining_time": "8:24:53", "throughput": 2509.95, "total_tokens": 1847328} +{"current_steps": 3190, "total_steps": 134280, "loss": 0.7216, "lr": 1.1874441465594282e-05, "epoch": 0.4751266011319631, "percentage": 2.38, "elapsed_time": "0:12:17", "remaining_time": "8:24:53", "throughput": 2509.89, "total_tokens": 1850240} +{"current_steps": 3195, "total_steps": 134280, "loss": 0.6005, "lr": 1.1893059279118262e-05, "epoch": 0.47587131367292224, "percentage": 2.38, "elapsed_time": "0:12:18", "remaining_time": "8:24:53", "throughput": 2509.95, "total_tokens": 1853216} +{"current_steps": 3200, "total_steps": 134280, "loss": 0.5401, "lr": 1.1911677092642242e-05, "epoch": 0.47661602621388144, "percentage": 2.38, "elapsed_time": "0:12:19", "remaining_time": "8:24:49", "throughput": 2509.96, "total_tokens": 1856000} +{"current_steps": 3205, "total_steps": 134280, "loss": 0.6845, "lr": 1.193029490616622e-05, "epoch": 0.47736073875484064, "percentage": 2.39, "elapsed_time": "0:12:20", "remaining_time": "8:24:47", "throughput": 2510.04, "total_tokens": 1858912} +{"current_steps": 3210, "total_steps": 134280, "loss": 0.7349, "lr": 1.19489127196902e-05, "epoch": 0.47810545129579984, "percentage": 2.39, "elapsed_time": "0:12:21", "remaining_time": "8:24:52", "throughput": 2510.18, "total_tokens": 1862240} +{"current_steps": 3215, "total_steps": 134280, "loss": 0.8585, "lr": 1.196753053321418e-05, "epoch": 0.478850163836759, "percentage": 2.39, "elapsed_time": "0:12:22", "remaining_time": "8:24:48", "throughput": 2510.06, "total_tokens": 1864896} +{"current_steps": 3220, "total_steps": 134280, "loss": 0.7113, "lr": 1.198614834673816e-05, "epoch": 0.4795948763777182, "percentage": 2.4, "elapsed_time": "0:12:24", "remaining_time": "8:24:48", "throughput": 2510.1, "total_tokens": 1867904} +{"current_steps": 3225, "total_steps": 134280, "loss": 0.7082, "lr": 1.200476616026214e-05, "epoch": 0.4803395889186774, "percentage": 2.4, "elapsed_time": "0:12:25", "remaining_time": "8:24:43", "throughput": 2509.98, "total_tokens": 1870496} +{"current_steps": 3230, "total_steps": 134280, "loss": 0.5399, "lr": 1.202338397378612e-05, "epoch": 0.4810843014596366, "percentage": 2.41, "elapsed_time": "0:12:26", "remaining_time": "8:24:40", "throughput": 2509.86, "total_tokens": 1873152} +{"current_steps": 3235, "total_steps": 134280, "loss": 0.6395, "lr": 1.20420017873101e-05, "epoch": 0.48182901400059575, "percentage": 2.41, "elapsed_time": "0:12:27", "remaining_time": "8:24:38", "throughput": 2509.92, "total_tokens": 1876096} +{"current_steps": 3240, "total_steps": 134280, "loss": 0.7054, "lr": 1.206061960083408e-05, "epoch": 0.48257372654155495, "percentage": 2.41, "elapsed_time": "0:12:28", "remaining_time": "8:24:40", "throughput": 2509.94, "total_tokens": 1879168} +{"current_steps": 3245, "total_steps": 134280, "loss": 0.6064, "lr": 1.2079237414358058e-05, "epoch": 0.48331843908251415, "percentage": 2.42, "elapsed_time": "0:12:29", "remaining_time": "8:24:42", "throughput": 2510.02, "total_tokens": 1882304} +{"current_steps": 3250, "total_steps": 134280, "loss": 0.7087, "lr": 1.2097855227882038e-05, "epoch": 0.48406315162347335, "percentage": 2.42, "elapsed_time": "0:12:31", "remaining_time": "8:24:39", "throughput": 2510.0, "total_tokens": 1885120} +{"current_steps": 3255, "total_steps": 134280, "loss": 0.622, "lr": 1.2116473041406018e-05, "epoch": 0.48480786416443256, "percentage": 2.42, "elapsed_time": "0:12:32", "remaining_time": "8:24:37", "throughput": 2509.99, "total_tokens": 1887968} +{"current_steps": 3260, "total_steps": 134280, "loss": 0.8116, "lr": 1.2135090854929997e-05, "epoch": 0.4855525767053917, "percentage": 2.43, "elapsed_time": "0:12:33", "remaining_time": "8:24:33", "throughput": 2509.99, "total_tokens": 1890688} +{"current_steps": 3265, "total_steps": 134280, "loss": 0.4603, "lr": 1.2153708668453977e-05, "epoch": 0.4862972892463509, "percentage": 2.43, "elapsed_time": "0:12:34", "remaining_time": "8:24:30", "throughput": 2509.94, "total_tokens": 1893408} +{"current_steps": 3270, "total_steps": 134280, "loss": 0.4725, "lr": 1.2172326481977957e-05, "epoch": 0.4870420017873101, "percentage": 2.44, "elapsed_time": "0:12:35", "remaining_time": "8:24:28", "throughput": 2509.98, "total_tokens": 1896288} +{"current_steps": 3275, "total_steps": 134280, "loss": 1.0182, "lr": 1.2190944295501937e-05, "epoch": 0.4877867143282693, "percentage": 2.44, "elapsed_time": "0:12:36", "remaining_time": "8:24:29", "throughput": 2509.98, "total_tokens": 1899296} +{"current_steps": 3280, "total_steps": 134280, "loss": 0.7142, "lr": 1.2209562109025917e-05, "epoch": 0.48853142686922846, "percentage": 2.44, "elapsed_time": "0:12:37", "remaining_time": "8:24:27", "throughput": 2510.0, "total_tokens": 1902176} +{"current_steps": 3285, "total_steps": 134280, "loss": 0.5823, "lr": 1.2228179922549897e-05, "epoch": 0.48927613941018766, "percentage": 2.45, "elapsed_time": "0:12:38", "remaining_time": "8:24:24", "throughput": 2510.01, "total_tokens": 1904992} +{"current_steps": 3290, "total_steps": 134280, "loss": 0.7443, "lr": 1.2246797736073875e-05, "epoch": 0.49002085195114686, "percentage": 2.45, "elapsed_time": "0:12:40", "remaining_time": "8:24:23", "throughput": 2510.08, "total_tokens": 1907936} +{"current_steps": 3295, "total_steps": 134280, "loss": 0.5885, "lr": 1.2265415549597855e-05, "epoch": 0.49076556449210607, "percentage": 2.45, "elapsed_time": "0:12:41", "remaining_time": "8:24:23", "throughput": 2510.28, "total_tokens": 1911072} +{"current_steps": 3300, "total_steps": 134280, "loss": 0.728, "lr": 1.2284033363121835e-05, "epoch": 0.4915102770330652, "percentage": 2.46, "elapsed_time": "0:12:42", "remaining_time": "8:24:20", "throughput": 2510.2, "total_tokens": 1913792} +{"current_steps": 3305, "total_steps": 134280, "loss": 0.658, "lr": 1.2302651176645815e-05, "epoch": 0.4922549895740244, "percentage": 2.46, "elapsed_time": "0:12:43", "remaining_time": "8:24:20", "throughput": 2510.35, "total_tokens": 1916864} +{"current_steps": 3310, "total_steps": 134280, "loss": 0.5509, "lr": 1.2321268990169795e-05, "epoch": 0.4929997021149836, "percentage": 2.46, "elapsed_time": "0:12:44", "remaining_time": "8:24:25", "throughput": 2510.34, "total_tokens": 1920128} +{"current_steps": 3315, "total_steps": 134280, "loss": 0.6228, "lr": 1.2339886803693775e-05, "epoch": 0.4937444146559428, "percentage": 2.47, "elapsed_time": "0:12:46", "remaining_time": "8:24:22", "throughput": 2510.35, "total_tokens": 1922976} +{"current_steps": 3320, "total_steps": 134280, "loss": 0.5179, "lr": 1.2358504617217755e-05, "epoch": 0.494489127196902, "percentage": 2.47, "elapsed_time": "0:12:47", "remaining_time": "8:24:23", "throughput": 2510.33, "total_tokens": 1925952} +{"current_steps": 3325, "total_steps": 134280, "loss": 0.8293, "lr": 1.2377122430741735e-05, "epoch": 0.49523383973786117, "percentage": 2.48, "elapsed_time": "0:12:48", "remaining_time": "8:24:21", "throughput": 2510.46, "total_tokens": 1928928} +{"current_steps": 3330, "total_steps": 134280, "loss": 0.6587, "lr": 1.2395740244265713e-05, "epoch": 0.4959785522788204, "percentage": 2.48, "elapsed_time": "0:12:49", "remaining_time": "8:24:19", "throughput": 2510.5, "total_tokens": 1931808} +{"current_steps": 3335, "total_steps": 134280, "loss": 0.6507, "lr": 1.2414358057789693e-05, "epoch": 0.4967232648197796, "percentage": 2.48, "elapsed_time": "0:12:50", "remaining_time": "8:24:16", "throughput": 2510.45, "total_tokens": 1934528} +{"current_steps": 3340, "total_steps": 134280, "loss": 0.8396, "lr": 1.2432975871313673e-05, "epoch": 0.4974679773607388, "percentage": 2.49, "elapsed_time": "0:12:51", "remaining_time": "8:24:16", "throughput": 2510.51, "total_tokens": 1937568} +{"current_steps": 3345, "total_steps": 134280, "loss": 0.8858, "lr": 1.2451593684837653e-05, "epoch": 0.4982126899016979, "percentage": 2.49, "elapsed_time": "0:12:53", "remaining_time": "8:24:19", "throughput": 2510.63, "total_tokens": 1940832} +{"current_steps": 3350, "total_steps": 134280, "loss": 0.5917, "lr": 1.2470211498361634e-05, "epoch": 0.4989574024426571, "percentage": 2.49, "elapsed_time": "0:12:54", "remaining_time": "8:24:15", "throughput": 2510.6, "total_tokens": 1943520} +{"current_steps": 3355, "total_steps": 134280, "loss": 0.6619, "lr": 1.2488829311885613e-05, "epoch": 0.49970211498361633, "percentage": 2.5, "elapsed_time": "0:12:55", "remaining_time": "8:24:12", "throughput": 2510.55, "total_tokens": 1946240} +{"current_steps": 3360, "total_steps": 134280, "loss": 0.5674, "lr": 1.2507447125409594e-05, "epoch": 0.5004468275245755, "percentage": 2.5, "elapsed_time": "0:12:56", "remaining_time": "8:24:11", "throughput": 2510.63, "total_tokens": 1949248} +{"current_steps": 3365, "total_steps": 134280, "loss": 0.6146, "lr": 1.252606493893357e-05, "epoch": 0.5011915400655347, "percentage": 2.51, "elapsed_time": "0:12:57", "remaining_time": "8:24:10", "throughput": 2510.65, "total_tokens": 1952160} +{"current_steps": 3370, "total_steps": 134280, "loss": 0.5728, "lr": 1.254468275245755e-05, "epoch": 0.5019362526064939, "percentage": 2.51, "elapsed_time": "0:12:58", "remaining_time": "8:24:08", "throughput": 2510.69, "total_tokens": 1955040} +{"current_steps": 3375, "total_steps": 134280, "loss": 0.779, "lr": 1.256330056598153e-05, "epoch": 0.5026809651474531, "percentage": 2.51, "elapsed_time": "0:12:59", "remaining_time": "8:24:06", "throughput": 2510.71, "total_tokens": 1957888} +{"current_steps": 3380, "total_steps": 134280, "loss": 0.707, "lr": 1.258191837950551e-05, "epoch": 0.5034256776884123, "percentage": 2.52, "elapsed_time": "0:13:01", "remaining_time": "8:24:07", "throughput": 2510.75, "total_tokens": 1960992} +{"current_steps": 3385, "total_steps": 134280, "loss": 0.55, "lr": 1.260053619302949e-05, "epoch": 0.5041703902293715, "percentage": 2.52, "elapsed_time": "0:13:02", "remaining_time": "8:24:07", "throughput": 2510.81, "total_tokens": 1963968} +{"current_steps": 3390, "total_steps": 134280, "loss": 0.8192, "lr": 1.2619154006553472e-05, "epoch": 0.5049151027703307, "percentage": 2.52, "elapsed_time": "0:13:03", "remaining_time": "8:24:06", "throughput": 2510.77, "total_tokens": 1966848} +{"current_steps": 3395, "total_steps": 134280, "loss": 0.6152, "lr": 1.2637771820077452e-05, "epoch": 0.5056598153112899, "percentage": 2.53, "elapsed_time": "0:13:04", "remaining_time": "8:24:02", "throughput": 2510.69, "total_tokens": 1969536} +{"current_steps": 3400, "total_steps": 134280, "loss": 0.7087, "lr": 1.2656389633601432e-05, "epoch": 0.506404527852249, "percentage": 2.53, "elapsed_time": "0:13:05", "remaining_time": "8:24:04", "throughput": 2510.8, "total_tokens": 1972704} +{"current_steps": 3405, "total_steps": 134280, "loss": 0.6898, "lr": 1.2675007447125412e-05, "epoch": 0.5071492403932082, "percentage": 2.54, "elapsed_time": "0:13:06", "remaining_time": "8:24:02", "throughput": 2510.81, "total_tokens": 1975552} +{"current_steps": 3410, "total_steps": 134280, "loss": 0.7849, "lr": 1.2693625260649388e-05, "epoch": 0.5078939529341674, "percentage": 2.54, "elapsed_time": "0:13:08", "remaining_time": "8:24:02", "throughput": 2510.94, "total_tokens": 1978624} +{"current_steps": 3415, "total_steps": 134280, "loss": 0.7183, "lr": 1.2712243074173368e-05, "epoch": 0.5086386654751266, "percentage": 2.54, "elapsed_time": "0:13:09", "remaining_time": "8:24:04", "throughput": 2511.0, "total_tokens": 1981824} +{"current_steps": 3420, "total_steps": 134280, "loss": 0.7571, "lr": 1.2730860887697348e-05, "epoch": 0.5093833780160858, "percentage": 2.55, "elapsed_time": "0:13:10", "remaining_time": "8:24:03", "throughput": 2511.02, "total_tokens": 1984736} +{"current_steps": 3425, "total_steps": 134280, "loss": 0.756, "lr": 1.2749478701221328e-05, "epoch": 0.510128090557045, "percentage": 2.55, "elapsed_time": "0:13:11", "remaining_time": "8:24:01", "throughput": 2511.0, "total_tokens": 1987552} +{"current_steps": 3430, "total_steps": 134280, "loss": 0.7049, "lr": 1.276809651474531e-05, "epoch": 0.5108728030980042, "percentage": 2.55, "elapsed_time": "0:13:12", "remaining_time": "8:24:06", "throughput": 2511.05, "total_tokens": 1990880} +{"current_steps": 3435, "total_steps": 134280, "loss": 0.6492, "lr": 1.278671432826929e-05, "epoch": 0.5116175156389634, "percentage": 2.56, "elapsed_time": "0:13:14", "remaining_time": "8:24:08", "throughput": 2511.12, "total_tokens": 1994048} +{"current_steps": 3440, "total_steps": 134280, "loss": 0.6028, "lr": 1.280533214179327e-05, "epoch": 0.5123622281799225, "percentage": 2.56, "elapsed_time": "0:13:15", "remaining_time": "8:24:17", "throughput": 2511.34, "total_tokens": 1997792} +{"current_steps": 3445, "total_steps": 134280, "loss": 0.6615, "lr": 1.282394995531725e-05, "epoch": 0.5131069407208817, "percentage": 2.57, "elapsed_time": "0:13:16", "remaining_time": "8:24:17", "throughput": 2511.33, "total_tokens": 2000800} +{"current_steps": 3450, "total_steps": 134280, "loss": 0.634, "lr": 1.2842567768841226e-05, "epoch": 0.5138516532618409, "percentage": 2.57, "elapsed_time": "0:13:17", "remaining_time": "8:24:19", "throughput": 2511.37, "total_tokens": 2003904} +{"current_steps": 3455, "total_steps": 134280, "loss": 0.7966, "lr": 1.2861185582365206e-05, "epoch": 0.5145963658028001, "percentage": 2.57, "elapsed_time": "0:13:19", "remaining_time": "8:24:20", "throughput": 2511.35, "total_tokens": 2006944} +{"current_steps": 3460, "total_steps": 134280, "loss": 0.661, "lr": 1.2879803395889186e-05, "epoch": 0.5153410783437593, "percentage": 2.58, "elapsed_time": "0:13:20", "remaining_time": "8:24:26", "throughput": 2511.51, "total_tokens": 2010496} +{"current_steps": 3465, "total_steps": 134280, "loss": 0.6873, "lr": 1.2898421209413166e-05, "epoch": 0.5160857908847185, "percentage": 2.58, "elapsed_time": "0:13:21", "remaining_time": "8:24:26", "throughput": 2511.48, "total_tokens": 2013408} +{"current_steps": 3470, "total_steps": 134280, "loss": 0.7084, "lr": 1.2917039022937148e-05, "epoch": 0.5168305034256777, "percentage": 2.58, "elapsed_time": "0:13:22", "remaining_time": "8:24:22", "throughput": 2511.34, "total_tokens": 2016032} +{"current_steps": 3475, "total_steps": 134280, "loss": 0.6944, "lr": 1.2935656836461127e-05, "epoch": 0.5175752159666369, "percentage": 2.59, "elapsed_time": "0:13:23", "remaining_time": "8:24:18", "throughput": 2511.34, "total_tokens": 2018752} +{"current_steps": 3480, "total_steps": 134280, "loss": 0.7907, "lr": 1.2954274649985107e-05, "epoch": 0.5183199285075961, "percentage": 2.59, "elapsed_time": "0:13:24", "remaining_time": "8:24:16", "throughput": 2511.31, "total_tokens": 2021600} +{"current_steps": 3485, "total_steps": 134280, "loss": 0.8082, "lr": 1.2972892463509087e-05, "epoch": 0.5190646410485552, "percentage": 2.6, "elapsed_time": "0:13:26", "remaining_time": "8:24:16", "throughput": 2511.26, "total_tokens": 2024544} +{"current_steps": 3490, "total_steps": 134280, "loss": 0.778, "lr": 1.2991510277033067e-05, "epoch": 0.5198093535895144, "percentage": 2.6, "elapsed_time": "0:13:27", "remaining_time": "8:24:17", "throughput": 2511.26, "total_tokens": 2027552} +{"current_steps": 3495, "total_steps": 134280, "loss": 0.6248, "lr": 1.3010128090557044e-05, "epoch": 0.5205540661304736, "percentage": 2.6, "elapsed_time": "0:13:28", "remaining_time": "8:24:17", "throughput": 2511.38, "total_tokens": 2030656} +{"current_steps": 3500, "total_steps": 134280, "loss": 0.7026, "lr": 1.3028745904081024e-05, "epoch": 0.5212987786714328, "percentage": 2.61, "elapsed_time": "0:13:29", "remaining_time": "8:24:15", "throughput": 2511.48, "total_tokens": 2033600} +{"current_steps": 3505, "total_steps": 134280, "loss": 0.6897, "lr": 1.3047363717605005e-05, "epoch": 0.522043491212392, "percentage": 2.61, "elapsed_time": "0:13:30", "remaining_time": "8:24:15", "throughput": 2511.5, "total_tokens": 2036544} +{"current_steps": 3510, "total_steps": 134280, "loss": 0.6061, "lr": 1.3065981531128985e-05, "epoch": 0.5227882037533512, "percentage": 2.61, "elapsed_time": "0:13:32", "remaining_time": "8:24:12", "throughput": 2511.51, "total_tokens": 2039392} +{"current_steps": 3515, "total_steps": 134280, "loss": 0.7028, "lr": 1.3084599344652965e-05, "epoch": 0.5235329162943104, "percentage": 2.62, "elapsed_time": "0:13:33", "remaining_time": "8:24:08", "throughput": 2511.48, "total_tokens": 2042080} +{"current_steps": 3520, "total_steps": 134280, "loss": 0.7189, "lr": 1.3103217158176945e-05, "epoch": 0.5242776288352696, "percentage": 2.62, "elapsed_time": "0:13:34", "remaining_time": "8:24:07", "throughput": 2511.54, "total_tokens": 2044992} +{"current_steps": 3525, "total_steps": 134280, "loss": 0.7385, "lr": 1.3121834971700925e-05, "epoch": 0.5250223413762288, "percentage": 2.63, "elapsed_time": "0:13:35", "remaining_time": "8:24:04", "throughput": 2511.5, "total_tokens": 2047776} +{"current_steps": 3530, "total_steps": 134280, "loss": 0.6774, "lr": 1.3140452785224905e-05, "epoch": 0.5257670539171879, "percentage": 2.63, "elapsed_time": "0:13:36", "remaining_time": "8:24:04", "throughput": 2511.6, "total_tokens": 2050816} +{"current_steps": 3535, "total_steps": 134280, "loss": 0.7314, "lr": 1.3159070598748885e-05, "epoch": 0.5265117664581471, "percentage": 2.63, "elapsed_time": "0:13:37", "remaining_time": "8:24:05", "throughput": 2511.72, "total_tokens": 2053952} +{"current_steps": 3540, "total_steps": 134280, "loss": 0.649, "lr": 1.3177688412272861e-05, "epoch": 0.5272564789991063, "percentage": 2.64, "elapsed_time": "0:13:38", "remaining_time": "8:24:03", "throughput": 2511.77, "total_tokens": 2056896} +{"current_steps": 3545, "total_steps": 134280, "loss": 0.6511, "lr": 1.3196306225796843e-05, "epoch": 0.5280011915400655, "percentage": 2.64, "elapsed_time": "0:13:40", "remaining_time": "8:24:02", "throughput": 2511.76, "total_tokens": 2059776} +{"current_steps": 3550, "total_steps": 134280, "loss": 0.6617, "lr": 1.3214924039320823e-05, "epoch": 0.5287459040810247, "percentage": 2.64, "elapsed_time": "0:13:41", "remaining_time": "8:24:03", "throughput": 2511.84, "total_tokens": 2062880} +{"current_steps": 3555, "total_steps": 134280, "loss": 0.6682, "lr": 1.3233541852844803e-05, "epoch": 0.5294906166219839, "percentage": 2.65, "elapsed_time": "0:13:42", "remaining_time": "8:24:02", "throughput": 2511.89, "total_tokens": 2065856} +{"current_steps": 3560, "total_steps": 134280, "loss": 0.7425, "lr": 1.3252159666368783e-05, "epoch": 0.5302353291629431, "percentage": 2.65, "elapsed_time": "0:13:43", "remaining_time": "8:23:59", "throughput": 2511.95, "total_tokens": 2068704} +{"current_steps": 3565, "total_steps": 134280, "loss": 0.6277, "lr": 1.3270777479892763e-05, "epoch": 0.5309800417039023, "percentage": 2.65, "elapsed_time": "0:13:44", "remaining_time": "8:23:56", "throughput": 2511.96, "total_tokens": 2071488} +{"current_steps": 3570, "total_steps": 134280, "loss": 0.7199, "lr": 1.3289395293416743e-05, "epoch": 0.5317247542448614, "percentage": 2.66, "elapsed_time": "0:13:45", "remaining_time": "8:23:56", "throughput": 2511.95, "total_tokens": 2074432} +{"current_steps": 3575, "total_steps": 134280, "loss": 0.6071, "lr": 1.3308013106940723e-05, "epoch": 0.5324694667858206, "percentage": 2.66, "elapsed_time": "0:13:46", "remaining_time": "8:23:52", "throughput": 2511.92, "total_tokens": 2077120} +{"current_steps": 3580, "total_steps": 134280, "loss": 0.6444, "lr": 1.33266309204647e-05, "epoch": 0.5332141793267798, "percentage": 2.67, "elapsed_time": "0:13:48", "remaining_time": "8:23:50", "throughput": 2511.93, "total_tokens": 2079968} +{"current_steps": 3585, "total_steps": 134280, "loss": 0.6063, "lr": 1.334524873398868e-05, "epoch": 0.533958891867739, "percentage": 2.67, "elapsed_time": "0:13:49", "remaining_time": "8:23:48", "throughput": 2511.84, "total_tokens": 2082784} +{"current_steps": 3590, "total_steps": 134280, "loss": 0.5577, "lr": 1.336386654751266e-05, "epoch": 0.5347036044086982, "percentage": 2.67, "elapsed_time": "0:13:50", "remaining_time": "8:23:50", "throughput": 2511.88, "total_tokens": 2085920} +{"current_steps": 3595, "total_steps": 134280, "loss": 0.6994, "lr": 1.338248436103664e-05, "epoch": 0.5354483169496574, "percentage": 2.68, "elapsed_time": "0:13:51", "remaining_time": "8:23:47", "throughput": 2511.78, "total_tokens": 2088608} +{"current_steps": 3600, "total_steps": 134280, "loss": 0.6861, "lr": 1.340110217456062e-05, "epoch": 0.5361930294906166, "percentage": 2.68, "elapsed_time": "0:13:52", "remaining_time": "8:23:46", "throughput": 2511.82, "total_tokens": 2091584} +{"current_steps": 3605, "total_steps": 134280, "loss": 0.6381, "lr": 1.34197199880846e-05, "epoch": 0.5369377420315758, "percentage": 2.68, "elapsed_time": "0:13:53", "remaining_time": "8:23:43", "throughput": 2511.74, "total_tokens": 2094272} +{"current_steps": 3610, "total_steps": 134280, "loss": 0.5996, "lr": 1.343833780160858e-05, "epoch": 0.537682454572535, "percentage": 2.69, "elapsed_time": "0:13:54", "remaining_time": "8:23:43", "throughput": 2511.87, "total_tokens": 2097344} +{"current_steps": 3615, "total_steps": 134280, "loss": 0.5358, "lr": 1.345695561513256e-05, "epoch": 0.5384271671134941, "percentage": 2.69, "elapsed_time": "0:13:56", "remaining_time": "8:23:41", "throughput": 2511.85, "total_tokens": 2100192} +{"current_steps": 3620, "total_steps": 134280, "loss": 0.6525, "lr": 1.347557342865654e-05, "epoch": 0.5391718796544533, "percentage": 2.7, "elapsed_time": "0:13:57", "remaining_time": "8:23:40", "throughput": 2511.92, "total_tokens": 2103136} +{"current_steps": 3625, "total_steps": 134280, "loss": 0.9127, "lr": 1.3494191242180519e-05, "epoch": 0.5399165921954125, "percentage": 2.7, "elapsed_time": "0:13:58", "remaining_time": "8:23:40", "throughput": 2512.05, "total_tokens": 2106272} +{"current_steps": 3630, "total_steps": 134280, "loss": 0.453, "lr": 1.3512809055704498e-05, "epoch": 0.5406613047363718, "percentage": 2.7, "elapsed_time": "0:13:59", "remaining_time": "8:23:42", "throughput": 2512.08, "total_tokens": 2109440} +{"current_steps": 3635, "total_steps": 134280, "loss": 0.7638, "lr": 1.3531426869228478e-05, "epoch": 0.541406017277331, "percentage": 2.71, "elapsed_time": "0:14:00", "remaining_time": "8:23:41", "throughput": 2512.07, "total_tokens": 2112352} +{"current_steps": 3640, "total_steps": 134280, "loss": 0.5561, "lr": 1.3550044682752458e-05, "epoch": 0.5421507298182902, "percentage": 2.71, "elapsed_time": "0:14:02", "remaining_time": "8:23:39", "throughput": 2512.08, "total_tokens": 2115200} +{"current_steps": 3645, "total_steps": 134280, "loss": 0.7983, "lr": 1.3568662496276438e-05, "epoch": 0.5428954423592494, "percentage": 2.71, "elapsed_time": "0:14:03", "remaining_time": "8:23:39", "throughput": 2512.06, "total_tokens": 2118112} +{"current_steps": 3650, "total_steps": 134280, "loss": 0.617, "lr": 1.3587280309800418e-05, "epoch": 0.5436401549002086, "percentage": 2.72, "elapsed_time": "0:14:04", "remaining_time": "8:23:38", "throughput": 2512.0, "total_tokens": 2121024} +{"current_steps": 3655, "total_steps": 134280, "loss": 0.6809, "lr": 1.3605898123324398e-05, "epoch": 0.5443848674411678, "percentage": 2.72, "elapsed_time": "0:14:05", "remaining_time": "8:23:35", "throughput": 2511.89, "total_tokens": 2123680} +{"current_steps": 3660, "total_steps": 134280, "loss": 0.6942, "lr": 1.3624515936848378e-05, "epoch": 0.5451295799821269, "percentage": 2.73, "elapsed_time": "0:14:06", "remaining_time": "8:23:37", "throughput": 2511.88, "total_tokens": 2126784} +{"current_steps": 3665, "total_steps": 134280, "loss": 0.7233, "lr": 1.3643133750372358e-05, "epoch": 0.5458742925230861, "percentage": 2.73, "elapsed_time": "0:14:07", "remaining_time": "8:23:34", "throughput": 2511.82, "total_tokens": 2129504} +{"current_steps": 3670, "total_steps": 134280, "loss": 0.7416, "lr": 1.3661751563896336e-05, "epoch": 0.5466190050640453, "percentage": 2.73, "elapsed_time": "0:14:08", "remaining_time": "8:23:32", "throughput": 2511.83, "total_tokens": 2132416} +{"current_steps": 3675, "total_steps": 134280, "loss": 0.6461, "lr": 1.3680369377420316e-05, "epoch": 0.5473637176050045, "percentage": 2.74, "elapsed_time": "0:14:10", "remaining_time": "8:23:30", "throughput": 2511.83, "total_tokens": 2135264} +{"current_steps": 3680, "total_steps": 134280, "loss": 0.8017, "lr": 1.3698987190944296e-05, "epoch": 0.5481084301459637, "percentage": 2.74, "elapsed_time": "0:14:11", "remaining_time": "8:23:33", "throughput": 2511.92, "total_tokens": 2138496} +{"current_steps": 3685, "total_steps": 134280, "loss": 0.6224, "lr": 1.3717605004468276e-05, "epoch": 0.5488531426869229, "percentage": 2.74, "elapsed_time": "0:14:12", "remaining_time": "8:23:31", "throughput": 2511.9, "total_tokens": 2141344} +{"current_steps": 3690, "total_steps": 134280, "loss": 0.7116, "lr": 1.3736222817992256e-05, "epoch": 0.5495978552278821, "percentage": 2.75, "elapsed_time": "0:14:13", "remaining_time": "8:23:30", "throughput": 2511.9, "total_tokens": 2144256} +{"current_steps": 3695, "total_steps": 134280, "loss": 0.6396, "lr": 1.3754840631516236e-05, "epoch": 0.5503425677688413, "percentage": 2.75, "elapsed_time": "0:14:14", "remaining_time": "8:23:28", "throughput": 2511.83, "total_tokens": 2147040} +{"current_steps": 3700, "total_steps": 134280, "loss": 0.6622, "lr": 1.3773458445040216e-05, "epoch": 0.5510872803098004, "percentage": 2.76, "elapsed_time": "0:14:16", "remaining_time": "8:23:30", "throughput": 2511.82, "total_tokens": 2150144} +{"current_steps": 3705, "total_steps": 134280, "loss": 0.5652, "lr": 1.3792076258564196e-05, "epoch": 0.5518319928507596, "percentage": 2.76, "elapsed_time": "0:14:17", "remaining_time": "8:23:27", "throughput": 2511.69, "total_tokens": 2152864} +{"current_steps": 3710, "total_steps": 134280, "loss": 0.7579, "lr": 1.3810694072088174e-05, "epoch": 0.5525767053917188, "percentage": 2.76, "elapsed_time": "0:14:18", "remaining_time": "8:23:29", "throughput": 2511.75, "total_tokens": 2156032} +{"current_steps": 3715, "total_steps": 134280, "loss": 0.5975, "lr": 1.3829311885612154e-05, "epoch": 0.553321417932678, "percentage": 2.77, "elapsed_time": "0:14:19", "remaining_time": "8:23:28", "throughput": 2511.67, "total_tokens": 2158848} +{"current_steps": 3720, "total_steps": 134280, "loss": 0.6901, "lr": 1.3847929699136134e-05, "epoch": 0.5540661304736372, "percentage": 2.77, "elapsed_time": "0:14:20", "remaining_time": "8:23:26", "throughput": 2511.66, "total_tokens": 2161664} +{"current_steps": 3725, "total_steps": 134280, "loss": 0.6474, "lr": 1.3866547512660114e-05, "epoch": 0.5548108430145964, "percentage": 2.77, "elapsed_time": "0:14:21", "remaining_time": "8:23:23", "throughput": 2511.73, "total_tokens": 2164544} +{"current_steps": 3730, "total_steps": 134280, "loss": 0.7883, "lr": 1.3885165326184094e-05, "epoch": 0.5555555555555556, "percentage": 2.78, "elapsed_time": "0:14:22", "remaining_time": "8:23:20", "throughput": 2511.57, "total_tokens": 2167168} +{"current_steps": 3735, "total_steps": 134280, "loss": 0.6118, "lr": 1.3903783139708073e-05, "epoch": 0.5563002680965148, "percentage": 2.78, "elapsed_time": "0:14:24", "remaining_time": "8:23:18", "throughput": 2511.5, "total_tokens": 2169952} +{"current_steps": 3740, "total_steps": 134280, "loss": 0.7325, "lr": 1.3922400953232053e-05, "epoch": 0.557044980637474, "percentage": 2.79, "elapsed_time": "0:14:25", "remaining_time": "8:23:23", "throughput": 2511.6, "total_tokens": 2173376} +{"current_steps": 3745, "total_steps": 134280, "loss": 0.7374, "lr": 1.3941018766756033e-05, "epoch": 0.5577896931784331, "percentage": 2.79, "elapsed_time": "0:14:26", "remaining_time": "8:23:20", "throughput": 2511.49, "total_tokens": 2176032} +{"current_steps": 3750, "total_steps": 134280, "loss": 0.6254, "lr": 1.3959636580280013e-05, "epoch": 0.5585344057193923, "percentage": 2.79, "elapsed_time": "0:14:27", "remaining_time": "8:23:20", "throughput": 2511.63, "total_tokens": 2179136} +{"current_steps": 3755, "total_steps": 134280, "loss": 0.6224, "lr": 1.3978254393803992e-05, "epoch": 0.5592791182603515, "percentage": 2.8, "elapsed_time": "0:14:28", "remaining_time": "8:23:17", "throughput": 2511.61, "total_tokens": 2181920} +{"current_steps": 3760, "total_steps": 134280, "loss": 0.7511, "lr": 1.3996872207327971e-05, "epoch": 0.5600238308013107, "percentage": 2.8, "elapsed_time": "0:14:30", "remaining_time": "8:23:31", "throughput": 2511.82, "total_tokens": 2186080} +{"current_steps": 3765, "total_steps": 134280, "loss": 0.7493, "lr": 1.4015490020851951e-05, "epoch": 0.5607685433422699, "percentage": 2.8, "elapsed_time": "0:14:31", "remaining_time": "8:23:30", "throughput": 2511.9, "total_tokens": 2189120} +{"current_steps": 3770, "total_steps": 134280, "loss": 0.5897, "lr": 1.4034107834375931e-05, "epoch": 0.5615132558832291, "percentage": 2.81, "elapsed_time": "0:14:32", "remaining_time": "8:23:26", "throughput": 2511.8, "total_tokens": 2191744} +{"current_steps": 3775, "total_steps": 134280, "loss": 0.7681, "lr": 1.4052725647899911e-05, "epoch": 0.5622579684241883, "percentage": 2.81, "elapsed_time": "0:14:33", "remaining_time": "8:23:27", "throughput": 2511.84, "total_tokens": 2194816} +{"current_steps": 3780, "total_steps": 134280, "loss": 0.6599, "lr": 1.4071343461423891e-05, "epoch": 0.5630026809651475, "percentage": 2.82, "elapsed_time": "0:14:34", "remaining_time": "8:23:22", "throughput": 2511.68, "total_tokens": 2197312} +{"current_steps": 3785, "total_steps": 134280, "loss": 0.5713, "lr": 1.4089961274947871e-05, "epoch": 0.5637473935061067, "percentage": 2.82, "elapsed_time": "0:14:36", "remaining_time": "8:23:24", "throughput": 2511.74, "total_tokens": 2200448} +{"current_steps": 3790, "total_steps": 134280, "loss": 0.8252, "lr": 1.4108579088471851e-05, "epoch": 0.5644921060470658, "percentage": 2.82, "elapsed_time": "0:14:37", "remaining_time": "8:23:23", "throughput": 2511.71, "total_tokens": 2203392} +{"current_steps": 3795, "total_steps": 134280, "loss": 0.5102, "lr": 1.412719690199583e-05, "epoch": 0.565236818588025, "percentage": 2.83, "elapsed_time": "0:14:38", "remaining_time": "8:23:20", "throughput": 2511.66, "total_tokens": 2206112} +{"current_steps": 3800, "total_steps": 134280, "loss": 0.7887, "lr": 1.4145814715519809e-05, "epoch": 0.5659815311289842, "percentage": 2.83, "elapsed_time": "0:14:39", "remaining_time": "8:23:21", "throughput": 2511.72, "total_tokens": 2209216} +{"current_steps": 3805, "total_steps": 134280, "loss": 0.744, "lr": 1.4164432529043789e-05, "epoch": 0.5667262436699434, "percentage": 2.83, "elapsed_time": "0:14:40", "remaining_time": "8:23:17", "throughput": 2511.62, "total_tokens": 2211840} +{"current_steps": 3810, "total_steps": 134280, "loss": 0.6134, "lr": 1.4183050342567769e-05, "epoch": 0.5674709562109026, "percentage": 2.84, "elapsed_time": "0:14:41", "remaining_time": "8:23:18", "throughput": 2511.6, "total_tokens": 2214848} +{"current_steps": 3815, "total_steps": 134280, "loss": 0.6613, "lr": 1.4201668156091749e-05, "epoch": 0.5682156687518618, "percentage": 2.84, "elapsed_time": "0:14:43", "remaining_time": "8:23:17", "throughput": 2511.51, "total_tokens": 2217696} +{"current_steps": 3820, "total_steps": 134280, "loss": 0.7119, "lr": 1.4220285969615729e-05, "epoch": 0.568960381292821, "percentage": 2.84, "elapsed_time": "0:14:44", "remaining_time": "8:23:15", "throughput": 2511.41, "total_tokens": 2220480} +{"current_steps": 3825, "total_steps": 134280, "loss": 0.6886, "lr": 1.4238903783139709e-05, "epoch": 0.5697050938337802, "percentage": 2.85, "elapsed_time": "0:14:45", "remaining_time": "8:23:13", "throughput": 2511.29, "total_tokens": 2223200} +{"current_steps": 3830, "total_steps": 134280, "loss": 0.7906, "lr": 1.4257521596663689e-05, "epoch": 0.5704498063747393, "percentage": 2.85, "elapsed_time": "0:14:46", "remaining_time": "8:23:11", "throughput": 2511.25, "total_tokens": 2226048} +{"current_steps": 3835, "total_steps": 134280, "loss": 0.8421, "lr": 1.4276139410187669e-05, "epoch": 0.5711945189156985, "percentage": 2.86, "elapsed_time": "0:14:47", "remaining_time": "8:23:11", "throughput": 2511.29, "total_tokens": 2229024} +{"current_steps": 3840, "total_steps": 134280, "loss": 0.7467, "lr": 1.4294757223711647e-05, "epoch": 0.5719392314566577, "percentage": 2.86, "elapsed_time": "0:14:48", "remaining_time": "8:23:10", "throughput": 2511.34, "total_tokens": 2232032} +{"current_steps": 3845, "total_steps": 134280, "loss": 0.6569, "lr": 1.4313375037235627e-05, "epoch": 0.5726839439976169, "percentage": 2.86, "elapsed_time": "0:14:49", "remaining_time": "8:23:07", "throughput": 2511.32, "total_tokens": 2234752} +{"current_steps": 3850, "total_steps": 134280, "loss": 0.5667, "lr": 1.4331992850759607e-05, "epoch": 0.5734286565385761, "percentage": 2.87, "elapsed_time": "0:14:51", "remaining_time": "8:23:06", "throughput": 2511.33, "total_tokens": 2237664} +{"current_steps": 3855, "total_steps": 134280, "loss": 0.6606, "lr": 1.4350610664283587e-05, "epoch": 0.5741733690795353, "percentage": 2.87, "elapsed_time": "0:14:52", "remaining_time": "8:23:04", "throughput": 2511.3, "total_tokens": 2240480} +{"current_steps": 3860, "total_steps": 134280, "loss": 0.5931, "lr": 1.4369228477807567e-05, "epoch": 0.5749180816204945, "percentage": 2.87, "elapsed_time": "0:14:53", "remaining_time": "8:23:02", "throughput": 2511.21, "total_tokens": 2243264} +{"current_steps": 3865, "total_steps": 134280, "loss": 0.6804, "lr": 1.4387846291331546e-05, "epoch": 0.5756627941614537, "percentage": 2.88, "elapsed_time": "0:14:54", "remaining_time": "8:23:02", "throughput": 2511.22, "total_tokens": 2246304} +{"current_steps": 3870, "total_steps": 134280, "loss": 0.6043, "lr": 1.4406464104855526e-05, "epoch": 0.5764075067024129, "percentage": 2.88, "elapsed_time": "0:14:55", "remaining_time": "8:23:03", "throughput": 2511.12, "total_tokens": 2249216} +{"current_steps": 3875, "total_steps": 134280, "loss": 0.7326, "lr": 1.4425081918379506e-05, "epoch": 0.577152219243372, "percentage": 2.89, "elapsed_time": "0:14:56", "remaining_time": "8:22:59", "throughput": 2511.06, "total_tokens": 2251904} +{"current_steps": 3880, "total_steps": 134280, "loss": 0.7494, "lr": 1.4443699731903488e-05, "epoch": 0.5778969317843312, "percentage": 2.89, "elapsed_time": "0:14:57", "remaining_time": "8:22:59", "throughput": 2511.1, "total_tokens": 2254880} +{"current_steps": 3885, "total_steps": 134280, "loss": 0.6677, "lr": 1.4462317545427465e-05, "epoch": 0.5786416443252904, "percentage": 2.89, "elapsed_time": "0:14:59", "remaining_time": "8:22:59", "throughput": 2511.1, "total_tokens": 2257888} +{"current_steps": 3890, "total_steps": 134280, "loss": 0.6836, "lr": 1.4480935358951444e-05, "epoch": 0.5793863568662496, "percentage": 2.9, "elapsed_time": "0:15:00", "remaining_time": "8:22:57", "throughput": 2511.07, "total_tokens": 2260736} +{"current_steps": 3895, "total_steps": 134280, "loss": 0.8824, "lr": 1.4499553172475424e-05, "epoch": 0.5801310694072088, "percentage": 2.9, "elapsed_time": "0:15:01", "remaining_time": "8:23:00", "throughput": 2511.09, "total_tokens": 2263968} +{"current_steps": 3900, "total_steps": 134280, "loss": 0.6216, "lr": 1.4518170985999404e-05, "epoch": 0.580875781948168, "percentage": 2.9, "elapsed_time": "0:15:02", "remaining_time": "8:22:56", "throughput": 2510.96, "total_tokens": 2266560} +{"current_steps": 3905, "total_steps": 134280, "loss": 0.6052, "lr": 1.4536788799523384e-05, "epoch": 0.5816204944891272, "percentage": 2.91, "elapsed_time": "0:15:03", "remaining_time": "8:22:54", "throughput": 2510.95, "total_tokens": 2269376} +{"current_steps": 3910, "total_steps": 134280, "loss": 0.6531, "lr": 1.4555406613047364e-05, "epoch": 0.5823652070300864, "percentage": 2.91, "elapsed_time": "0:15:04", "remaining_time": "8:22:53", "throughput": 2510.96, "total_tokens": 2272320} +{"current_steps": 3915, "total_steps": 134280, "loss": 0.6911, "lr": 1.4574024426571346e-05, "epoch": 0.5831099195710456, "percentage": 2.92, "elapsed_time": "0:15:06", "remaining_time": "8:22:53", "throughput": 2510.99, "total_tokens": 2275328} +{"current_steps": 3920, "total_steps": 134280, "loss": 0.7766, "lr": 1.4592642240095326e-05, "epoch": 0.5838546321120047, "percentage": 2.92, "elapsed_time": "0:15:07", "remaining_time": "8:22:51", "throughput": 2511.04, "total_tokens": 2278240} +{"current_steps": 3925, "total_steps": 134280, "loss": 0.7741, "lr": 1.4611260053619302e-05, "epoch": 0.5845993446529639, "percentage": 2.92, "elapsed_time": "0:15:08", "remaining_time": "8:22:53", "throughput": 2511.18, "total_tokens": 2281504} +{"current_steps": 3930, "total_steps": 134280, "loss": 0.6095, "lr": 1.4629877867143282e-05, "epoch": 0.5853440571939231, "percentage": 2.93, "elapsed_time": "0:15:09", "remaining_time": "8:22:52", "throughput": 2511.14, "total_tokens": 2284320} +{"current_steps": 3935, "total_steps": 134280, "loss": 0.6819, "lr": 1.4648495680667262e-05, "epoch": 0.5860887697348823, "percentage": 2.93, "elapsed_time": "0:15:10", "remaining_time": "8:22:50", "throughput": 2511.16, "total_tokens": 2287232} +{"current_steps": 3940, "total_steps": 134280, "loss": 0.7502, "lr": 1.4667113494191242e-05, "epoch": 0.5868334822758415, "percentage": 2.93, "elapsed_time": "0:15:11", "remaining_time": "8:22:49", "throughput": 2511.24, "total_tokens": 2290176} +{"current_steps": 3945, "total_steps": 134280, "loss": 0.6566, "lr": 1.4685731307715222e-05, "epoch": 0.5875781948168007, "percentage": 2.94, "elapsed_time": "0:15:13", "remaining_time": "8:22:45", "throughput": 2511.17, "total_tokens": 2292832} +{"current_steps": 3950, "total_steps": 134280, "loss": 0.7481, "lr": 1.4704349121239202e-05, "epoch": 0.5883229073577599, "percentage": 2.94, "elapsed_time": "0:15:14", "remaining_time": "8:22:44", "throughput": 2511.14, "total_tokens": 2295712} +{"current_steps": 3955, "total_steps": 134280, "loss": 0.7638, "lr": 1.4722966934763183e-05, "epoch": 0.5890676198987191, "percentage": 2.95, "elapsed_time": "0:15:15", "remaining_time": "8:22:40", "throughput": 2511.14, "total_tokens": 2298432} +{"current_steps": 3960, "total_steps": 134280, "loss": 0.64, "lr": 1.4741584748287163e-05, "epoch": 0.5898123324396782, "percentage": 2.95, "elapsed_time": "0:15:16", "remaining_time": "8:22:40", "throughput": 2511.12, "total_tokens": 2301408} +{"current_steps": 3965, "total_steps": 134280, "loss": 0.6958, "lr": 1.4760202561811143e-05, "epoch": 0.5905570449806374, "percentage": 2.95, "elapsed_time": "0:15:17", "remaining_time": "8:22:41", "throughput": 2511.2, "total_tokens": 2304512} +{"current_steps": 3970, "total_steps": 134280, "loss": 0.6482, "lr": 1.477882037533512e-05, "epoch": 0.5913017575215966, "percentage": 2.96, "elapsed_time": "0:15:18", "remaining_time": "8:22:41", "throughput": 2511.27, "total_tokens": 2307584} +{"current_steps": 3975, "total_steps": 134280, "loss": 0.8006, "lr": 1.47974381888591e-05, "epoch": 0.5920464700625558, "percentage": 2.96, "elapsed_time": "0:15:20", "remaining_time": "8:22:39", "throughput": 2511.2, "total_tokens": 2310336} +{"current_steps": 3980, "total_steps": 134280, "loss": 0.6007, "lr": 1.481605600238308e-05, "epoch": 0.592791182603515, "percentage": 2.96, "elapsed_time": "0:15:21", "remaining_time": "8:22:41", "throughput": 2511.33, "total_tokens": 2313600} +{"current_steps": 3985, "total_steps": 134280, "loss": 0.6414, "lr": 1.483467381590706e-05, "epoch": 0.5935358951444742, "percentage": 2.97, "elapsed_time": "0:15:22", "remaining_time": "8:22:38", "throughput": 2511.38, "total_tokens": 2316448} +{"current_steps": 3990, "total_steps": 134280, "loss": 0.8485, "lr": 1.485329162943104e-05, "epoch": 0.5942806076854334, "percentage": 2.97, "elapsed_time": "0:15:23", "remaining_time": "8:22:41", "throughput": 2511.38, "total_tokens": 2319648} +{"current_steps": 3995, "total_steps": 134280, "loss": 0.6882, "lr": 1.4871909442955021e-05, "epoch": 0.5950253202263927, "percentage": 2.98, "elapsed_time": "0:15:24", "remaining_time": "8:22:39", "throughput": 2511.36, "total_tokens": 2322496} +{"current_steps": 4000, "total_steps": 134280, "loss": 0.7479, "lr": 1.4890527256479001e-05, "epoch": 0.5957700327673519, "percentage": 2.98, "elapsed_time": "0:15:26", "remaining_time": "8:22:39", "throughput": 2511.41, "total_tokens": 2325568} +{"current_steps": 4005, "total_steps": 134280, "loss": 0.7032, "lr": 1.4909145070002981e-05, "epoch": 0.596514745308311, "percentage": 2.98, "elapsed_time": "0:15:27", "remaining_time": "8:22:38", "throughput": 2511.47, "total_tokens": 2328512} +{"current_steps": 4010, "total_steps": 134280, "loss": 0.7906, "lr": 1.4927762883526961e-05, "epoch": 0.5972594578492701, "percentage": 2.99, "elapsed_time": "0:15:28", "remaining_time": "8:22:39", "throughput": 2511.48, "total_tokens": 2331584} +{"current_steps": 4015, "total_steps": 134280, "loss": 0.6899, "lr": 1.4946380697050938e-05, "epoch": 0.5980041703902294, "percentage": 2.99, "elapsed_time": "0:15:29", "remaining_time": "8:22:38", "throughput": 2511.49, "total_tokens": 2334528} +{"current_steps": 4020, "total_steps": 134280, "loss": 0.8384, "lr": 1.4964998510574917e-05, "epoch": 0.5987488829311886, "percentage": 2.99, "elapsed_time": "0:15:30", "remaining_time": "8:22:38", "throughput": 2511.6, "total_tokens": 2337600} +{"current_steps": 4025, "total_steps": 134280, "loss": 0.6599, "lr": 1.4983616324098897e-05, "epoch": 0.5994935954721478, "percentage": 3.0, "elapsed_time": "0:15:31", "remaining_time": "8:22:36", "throughput": 2511.61, "total_tokens": 2340480} +{"current_steps": 4030, "total_steps": 134280, "loss": 0.7664, "lr": 1.5002234137622877e-05, "epoch": 0.600238308013107, "percentage": 3.0, "elapsed_time": "0:15:32", "remaining_time": "8:22:33", "throughput": 2511.58, "total_tokens": 2343232} +{"current_steps": 4035, "total_steps": 134280, "loss": 0.6779, "lr": 1.5020851951146859e-05, "epoch": 0.6009830205540662, "percentage": 3.0, "elapsed_time": "0:15:34", "remaining_time": "8:22:30", "throughput": 2511.51, "total_tokens": 2345920} +{"current_steps": 4040, "total_steps": 134280, "loss": 0.7613, "lr": 1.5039469764670839e-05, "epoch": 0.6017277330950254, "percentage": 3.01, "elapsed_time": "0:15:35", "remaining_time": "8:22:33", "throughput": 2511.62, "total_tokens": 2349248} +{"current_steps": 4045, "total_steps": 134280, "loss": 0.5671, "lr": 1.5058087578194819e-05, "epoch": 0.6024724456359845, "percentage": 3.01, "elapsed_time": "0:15:36", "remaining_time": "8:22:33", "throughput": 2511.62, "total_tokens": 2352224} +{"current_steps": 4050, "total_steps": 134280, "loss": 0.518, "lr": 1.5076705391718799e-05, "epoch": 0.6032171581769437, "percentage": 3.02, "elapsed_time": "0:15:37", "remaining_time": "8:22:30", "throughput": 2511.65, "total_tokens": 2355040} +{"current_steps": 4055, "total_steps": 134280, "loss": 0.7075, "lr": 1.5095323205242775e-05, "epoch": 0.6039618707179029, "percentage": 3.02, "elapsed_time": "0:15:38", "remaining_time": "8:22:27", "throughput": 2511.58, "total_tokens": 2357728} +{"current_steps": 4060, "total_steps": 134280, "loss": 0.691, "lr": 1.5113941018766755e-05, "epoch": 0.6047065832588621, "percentage": 3.02, "elapsed_time": "0:15:39", "remaining_time": "8:22:26", "throughput": 2511.59, "total_tokens": 2360672} +{"current_steps": 4065, "total_steps": 134280, "loss": 0.6898, "lr": 1.5132558832290735e-05, "epoch": 0.6054512957998213, "percentage": 3.03, "elapsed_time": "0:15:41", "remaining_time": "8:22:23", "throughput": 2511.55, "total_tokens": 2363424} +{"current_steps": 4070, "total_steps": 134280, "loss": 0.6257, "lr": 1.5151176645814715e-05, "epoch": 0.6061960083407805, "percentage": 3.03, "elapsed_time": "0:15:42", "remaining_time": "8:22:23", "throughput": 2511.57, "total_tokens": 2366368} +{"current_steps": 4075, "total_steps": 134280, "loss": 0.7648, "lr": 1.5169794459338697e-05, "epoch": 0.6069407208817397, "percentage": 3.03, "elapsed_time": "0:15:43", "remaining_time": "8:22:22", "throughput": 2511.58, "total_tokens": 2369312} +{"current_steps": 4080, "total_steps": 134280, "loss": 0.5453, "lr": 1.5188412272862677e-05, "epoch": 0.6076854334226989, "percentage": 3.04, "elapsed_time": "0:15:44", "remaining_time": "8:22:22", "throughput": 2511.61, "total_tokens": 2372352} +{"current_steps": 4085, "total_steps": 134280, "loss": 0.5228, "lr": 1.5207030086386656e-05, "epoch": 0.6084301459636581, "percentage": 3.04, "elapsed_time": "0:15:45", "remaining_time": "8:22:20", "throughput": 2511.64, "total_tokens": 2375264} +{"current_steps": 4090, "total_steps": 134280, "loss": 0.6214, "lr": 1.5225647899910636e-05, "epoch": 0.6091748585046172, "percentage": 3.05, "elapsed_time": "0:15:46", "remaining_time": "8:22:18", "throughput": 2511.57, "total_tokens": 2377984} +{"current_steps": 4095, "total_steps": 134280, "loss": 0.6884, "lr": 1.5244265713434616e-05, "epoch": 0.6099195710455764, "percentage": 3.05, "elapsed_time": "0:15:48", "remaining_time": "8:22:18", "throughput": 2511.67, "total_tokens": 2381120} +{"current_steps": 4100, "total_steps": 134280, "loss": 0.8576, "lr": 1.5262883526958593e-05, "epoch": 0.6106642835865356, "percentage": 3.05, "elapsed_time": "0:15:49", "remaining_time": "8:22:15", "throughput": 2511.59, "total_tokens": 2383744} +{"current_steps": 4105, "total_steps": 134280, "loss": 0.5319, "lr": 1.5281501340482574e-05, "epoch": 0.6114089961274948, "percentage": 3.06, "elapsed_time": "0:15:50", "remaining_time": "8:22:11", "throughput": 2511.56, "total_tokens": 2386432} +{"current_steps": 4110, "total_steps": 134280, "loss": 0.7601, "lr": 1.5300119154006553e-05, "epoch": 0.612153708668454, "percentage": 3.06, "elapsed_time": "0:15:51", "remaining_time": "8:22:09", "throughput": 2511.57, "total_tokens": 2389312} +{"current_steps": 4115, "total_steps": 134280, "loss": 0.6554, "lr": 1.5318736967530534e-05, "epoch": 0.6128984212094132, "percentage": 3.06, "elapsed_time": "0:15:52", "remaining_time": "8:22:11", "throughput": 2511.74, "total_tokens": 2392608} +{"current_steps": 4120, "total_steps": 134280, "loss": 0.5395, "lr": 1.5337354781054513e-05, "epoch": 0.6136431337503724, "percentage": 3.07, "elapsed_time": "0:15:53", "remaining_time": "8:22:07", "throughput": 2511.71, "total_tokens": 2395296} +{"current_steps": 4125, "total_steps": 134280, "loss": 0.5465, "lr": 1.5355972594578494e-05, "epoch": 0.6143878462913316, "percentage": 3.07, "elapsed_time": "0:15:54", "remaining_time": "8:22:05", "throughput": 2511.74, "total_tokens": 2398112} +{"current_steps": 4130, "total_steps": 134280, "loss": 0.6946, "lr": 1.5374590408102472e-05, "epoch": 0.6151325588322908, "percentage": 3.08, "elapsed_time": "0:15:55", "remaining_time": "8:22:00", "throughput": 2511.68, "total_tokens": 2400704} +{"current_steps": 4135, "total_steps": 134280, "loss": 0.5321, "lr": 1.5393208221626454e-05, "epoch": 0.6158772713732499, "percentage": 3.08, "elapsed_time": "0:15:56", "remaining_time": "8:21:57", "throughput": 2511.61, "total_tokens": 2403392} +{"current_steps": 4140, "total_steps": 134280, "loss": 0.524, "lr": 1.5411826035150436e-05, "epoch": 0.6166219839142091, "percentage": 3.08, "elapsed_time": "0:15:58", "remaining_time": "8:21:57", "throughput": 2511.69, "total_tokens": 2406432} +{"current_steps": 4145, "total_steps": 134280, "loss": 0.7399, "lr": 1.543044384867441e-05, "epoch": 0.6173666964551683, "percentage": 3.09, "elapsed_time": "0:15:59", "remaining_time": "8:21:56", "throughput": 2511.75, "total_tokens": 2409376} +{"current_steps": 4150, "total_steps": 134280, "loss": 0.8324, "lr": 1.5449061662198392e-05, "epoch": 0.6181114089961275, "percentage": 3.09, "elapsed_time": "0:16:00", "remaining_time": "8:22:01", "throughput": 2511.84, "total_tokens": 2412864} +{"current_steps": 4155, "total_steps": 134280, "loss": 0.7606, "lr": 1.546767947572237e-05, "epoch": 0.6188561215370867, "percentage": 3.09, "elapsed_time": "0:16:01", "remaining_time": "8:21:59", "throughput": 2511.83, "total_tokens": 2415744} +{"current_steps": 4160, "total_steps": 134280, "loss": 0.7688, "lr": 1.5486297289246352e-05, "epoch": 0.6196008340780459, "percentage": 3.1, "elapsed_time": "0:16:02", "remaining_time": "8:21:57", "throughput": 2511.85, "total_tokens": 2418560} +{"current_steps": 4165, "total_steps": 134280, "loss": 0.6139, "lr": 1.550491510277033e-05, "epoch": 0.6203455466190051, "percentage": 3.1, "elapsed_time": "0:16:04", "remaining_time": "8:21:55", "throughput": 2511.85, "total_tokens": 2421440} +{"current_steps": 4170, "total_steps": 134280, "loss": 0.7516, "lr": 1.5523532916294312e-05, "epoch": 0.6210902591599643, "percentage": 3.11, "elapsed_time": "0:16:05", "remaining_time": "8:21:57", "throughput": 2511.93, "total_tokens": 2424640} +{"current_steps": 4175, "total_steps": 134280, "loss": 0.7258, "lr": 1.554215072981829e-05, "epoch": 0.6218349717009234, "percentage": 3.11, "elapsed_time": "0:16:06", "remaining_time": "8:21:56", "throughput": 2511.87, "total_tokens": 2427488} +{"current_steps": 4180, "total_steps": 134280, "loss": 0.6075, "lr": 1.5560768543342272e-05, "epoch": 0.6225796842418826, "percentage": 3.11, "elapsed_time": "0:16:07", "remaining_time": "8:21:53", "throughput": 2511.82, "total_tokens": 2430208} +{"current_steps": 4185, "total_steps": 134280, "loss": 0.6871, "lr": 1.557938635686625e-05, "epoch": 0.6233243967828418, "percentage": 3.12, "elapsed_time": "0:16:08", "remaining_time": "8:21:49", "throughput": 2511.73, "total_tokens": 2432864} +{"current_steps": 4190, "total_steps": 134280, "loss": 0.6759, "lr": 1.5598004170390228e-05, "epoch": 0.624069109323801, "percentage": 3.12, "elapsed_time": "0:16:09", "remaining_time": "8:21:49", "throughput": 2511.75, "total_tokens": 2435840} +{"current_steps": 4195, "total_steps": 134280, "loss": 0.6742, "lr": 1.561662198391421e-05, "epoch": 0.6248138218647602, "percentage": 3.12, "elapsed_time": "0:16:10", "remaining_time": "8:21:46", "throughput": 2511.74, "total_tokens": 2438560} +{"current_steps": 4200, "total_steps": 134280, "loss": 0.6982, "lr": 1.5635239797438188e-05, "epoch": 0.6255585344057194, "percentage": 3.13, "elapsed_time": "0:16:11", "remaining_time": "8:21:43", "throughput": 2511.73, "total_tokens": 2441376} +{"current_steps": 4205, "total_steps": 134280, "loss": 0.7313, "lr": 1.565385761096217e-05, "epoch": 0.6263032469466786, "percentage": 3.13, "elapsed_time": "0:16:13", "remaining_time": "8:21:42", "throughput": 2511.76, "total_tokens": 2444288} +{"current_steps": 4210, "total_steps": 134280, "loss": 0.6454, "lr": 1.5672475424486148e-05, "epoch": 0.6270479594876378, "percentage": 3.14, "elapsed_time": "0:16:14", "remaining_time": "8:21:41", "throughput": 2511.75, "total_tokens": 2447168} +{"current_steps": 4215, "total_steps": 134280, "loss": 0.617, "lr": 1.569109323801013e-05, "epoch": 0.627792672028597, "percentage": 3.14, "elapsed_time": "0:16:15", "remaining_time": "8:21:41", "throughput": 2511.79, "total_tokens": 2450240} +{"current_steps": 4220, "total_steps": 134280, "loss": 0.7659, "lr": 1.570971105153411e-05, "epoch": 0.6285373845695561, "percentage": 3.14, "elapsed_time": "0:16:16", "remaining_time": "8:21:39", "throughput": 2511.74, "total_tokens": 2453024} +{"current_steps": 4225, "total_steps": 134280, "loss": 0.6774, "lr": 1.572832886505809e-05, "epoch": 0.6292820971105153, "percentage": 3.15, "elapsed_time": "0:16:17", "remaining_time": "8:21:37", "throughput": 2511.78, "total_tokens": 2455872} +{"current_steps": 4230, "total_steps": 134280, "loss": 0.6786, "lr": 1.5746946678582068e-05, "epoch": 0.6300268096514745, "percentage": 3.15, "elapsed_time": "0:16:18", "remaining_time": "8:21:34", "throughput": 2511.76, "total_tokens": 2458624} +{"current_steps": 4235, "total_steps": 134280, "loss": 0.7309, "lr": 1.5765564492106046e-05, "epoch": 0.6307715221924337, "percentage": 3.15, "elapsed_time": "0:16:19", "remaining_time": "8:21:30", "throughput": 2511.73, "total_tokens": 2461312} +{"current_steps": 4240, "total_steps": 134280, "loss": 0.8002, "lr": 1.5784182305630027e-05, "epoch": 0.6315162347333929, "percentage": 3.16, "elapsed_time": "0:16:21", "remaining_time": "8:21:29", "throughput": 2511.86, "total_tokens": 2464352} +{"current_steps": 4245, "total_steps": 134280, "loss": 0.7207, "lr": 1.5802800119154006e-05, "epoch": 0.6322609472743521, "percentage": 3.16, "elapsed_time": "0:16:22", "remaining_time": "8:21:27", "throughput": 2511.73, "total_tokens": 2467040} +{"current_steps": 4250, "total_steps": 134280, "loss": 0.6339, "lr": 1.5821417932677987e-05, "epoch": 0.6330056598153113, "percentage": 3.17, "elapsed_time": "0:16:23", "remaining_time": "8:21:27", "throughput": 2511.8, "total_tokens": 2470112} +{"current_steps": 4255, "total_steps": 134280, "loss": 0.7237, "lr": 1.5840035746201966e-05, "epoch": 0.6337503723562705, "percentage": 3.17, "elapsed_time": "0:16:24", "remaining_time": "8:21:23", "throughput": 2511.74, "total_tokens": 2472768} +{"current_steps": 4260, "total_steps": 134280, "loss": 0.6379, "lr": 1.5858653559725947e-05, "epoch": 0.6344950848972297, "percentage": 3.17, "elapsed_time": "0:16:25", "remaining_time": "8:21:25", "throughput": 2511.82, "total_tokens": 2475936} +{"current_steps": 4265, "total_steps": 134280, "loss": 0.6915, "lr": 1.587727137324993e-05, "epoch": 0.6352397974381888, "percentage": 3.18, "elapsed_time": "0:16:26", "remaining_time": "8:21:22", "throughput": 2511.8, "total_tokens": 2478688} +{"current_steps": 4270, "total_steps": 134280, "loss": 0.7229, "lr": 1.5895889186773907e-05, "epoch": 0.635984509979148, "percentage": 3.18, "elapsed_time": "0:16:28", "remaining_time": "8:21:23", "throughput": 2511.76, "total_tokens": 2481728} +{"current_steps": 4275, "total_steps": 134280, "loss": 0.6041, "lr": 1.5914507000297885e-05, "epoch": 0.6367292225201072, "percentage": 3.18, "elapsed_time": "0:16:29", "remaining_time": "8:21:19", "throughput": 2511.74, "total_tokens": 2484416} +{"current_steps": 4280, "total_steps": 134280, "loss": 0.6263, "lr": 1.5933124813821863e-05, "epoch": 0.6374739350610664, "percentage": 3.19, "elapsed_time": "0:16:30", "remaining_time": "8:21:17", "throughput": 2511.76, "total_tokens": 2487296} +{"current_steps": 4285, "total_steps": 134280, "loss": 0.776, "lr": 1.5951742627345845e-05, "epoch": 0.6382186476020256, "percentage": 3.19, "elapsed_time": "0:16:31", "remaining_time": "8:21:17", "throughput": 2511.88, "total_tokens": 2490336} +{"current_steps": 4290, "total_steps": 134280, "loss": 0.7149, "lr": 1.5970360440869823e-05, "epoch": 0.6389633601429848, "percentage": 3.19, "elapsed_time": "0:16:32", "remaining_time": "8:21:18", "throughput": 2512.02, "total_tokens": 2493600} +{"current_steps": 4295, "total_steps": 134280, "loss": 0.5709, "lr": 1.5988978254393805e-05, "epoch": 0.639708072683944, "percentage": 3.2, "elapsed_time": "0:16:33", "remaining_time": "8:21:15", "throughput": 2512.0, "total_tokens": 2496352} +{"current_steps": 4300, "total_steps": 134280, "loss": 0.7099, "lr": 1.6007596067917787e-05, "epoch": 0.6404527852249032, "percentage": 3.2, "elapsed_time": "0:16:34", "remaining_time": "8:21:14", "throughput": 2512.06, "total_tokens": 2499296} +{"current_steps": 4305, "total_steps": 134280, "loss": 0.5969, "lr": 1.6026213881441765e-05, "epoch": 0.6411974977658623, "percentage": 3.21, "elapsed_time": "0:16:36", "remaining_time": "8:21:12", "throughput": 2512.02, "total_tokens": 2502080} +{"current_steps": 4310, "total_steps": 134280, "loss": 0.6048, "lr": 1.6044831694965746e-05, "epoch": 0.6419422103068215, "percentage": 3.21, "elapsed_time": "0:16:37", "remaining_time": "8:21:09", "throughput": 2511.97, "total_tokens": 2504832} +{"current_steps": 4315, "total_steps": 134280, "loss": 0.5826, "lr": 1.606344950848972e-05, "epoch": 0.6426869228477807, "percentage": 3.21, "elapsed_time": "0:16:38", "remaining_time": "8:21:08", "throughput": 2512.01, "total_tokens": 2507776} +{"current_steps": 4320, "total_steps": 134280, "loss": 0.6808, "lr": 1.6082067322013703e-05, "epoch": 0.6434316353887399, "percentage": 3.22, "elapsed_time": "0:16:39", "remaining_time": "8:21:07", "throughput": 2512.06, "total_tokens": 2510720} +{"current_steps": 4325, "total_steps": 134280, "loss": 0.5799, "lr": 1.610068513553768e-05, "epoch": 0.6441763479296991, "percentage": 3.22, "elapsed_time": "0:16:40", "remaining_time": "8:21:06", "throughput": 2512.01, "total_tokens": 2513600} +{"current_steps": 4330, "total_steps": 134280, "loss": 0.6946, "lr": 1.6119302949061663e-05, "epoch": 0.6449210604706583, "percentage": 3.22, "elapsed_time": "0:16:41", "remaining_time": "8:21:05", "throughput": 2512.07, "total_tokens": 2516576} +{"current_steps": 4335, "total_steps": 134280, "loss": 0.7297, "lr": 1.6137920762585644e-05, "epoch": 0.6456657730116175, "percentage": 3.23, "elapsed_time": "0:16:42", "remaining_time": "8:21:02", "throughput": 2512.06, "total_tokens": 2519296} +{"current_steps": 4340, "total_steps": 134280, "loss": 0.7145, "lr": 1.6156538576109623e-05, "epoch": 0.6464104855525767, "percentage": 3.23, "elapsed_time": "0:16:44", "remaining_time": "8:21:00", "throughput": 2512.03, "total_tokens": 2522112} +{"current_steps": 4345, "total_steps": 134280, "loss": 0.7483, "lr": 1.6175156389633604e-05, "epoch": 0.6471551980935359, "percentage": 3.24, "elapsed_time": "0:16:45", "remaining_time": "8:21:01", "throughput": 2512.1, "total_tokens": 2525280} +{"current_steps": 4350, "total_steps": 134280, "loss": 0.7761, "lr": 1.6193774203157582e-05, "epoch": 0.647899910634495, "percentage": 3.24, "elapsed_time": "0:16:46", "remaining_time": "8:21:00", "throughput": 2512.22, "total_tokens": 2528288} +{"current_steps": 4355, "total_steps": 134280, "loss": 0.8533, "lr": 1.6212392016681564e-05, "epoch": 0.6486446231754542, "percentage": 3.24, "elapsed_time": "0:16:47", "remaining_time": "8:20:57", "throughput": 2512.17, "total_tokens": 2531040} +{"current_steps": 4360, "total_steps": 134280, "loss": 0.7357, "lr": 1.623100983020554e-05, "epoch": 0.6493893357164134, "percentage": 3.25, "elapsed_time": "0:16:48", "remaining_time": "8:20:56", "throughput": 2512.2, "total_tokens": 2533952} +{"current_steps": 4365, "total_steps": 134280, "loss": 0.5815, "lr": 1.624962764372952e-05, "epoch": 0.6501340482573726, "percentage": 3.25, "elapsed_time": "0:16:49", "remaining_time": "8:20:55", "throughput": 2512.19, "total_tokens": 2536864} +{"current_steps": 4370, "total_steps": 134280, "loss": 0.5752, "lr": 1.62682454572535e-05, "epoch": 0.6508787607983318, "percentage": 3.25, "elapsed_time": "0:16:50", "remaining_time": "8:20:52", "throughput": 2512.13, "total_tokens": 2539552} +{"current_steps": 4375, "total_steps": 134280, "loss": 0.6837, "lr": 1.628686327077748e-05, "epoch": 0.651623473339291, "percentage": 3.26, "elapsed_time": "0:16:51", "remaining_time": "8:20:48", "throughput": 2512.07, "total_tokens": 2542208} +{"current_steps": 4380, "total_steps": 134280, "loss": 0.7524, "lr": 1.6305481084301462e-05, "epoch": 0.6523681858802503, "percentage": 3.26, "elapsed_time": "0:16:53", "remaining_time": "8:20:47", "throughput": 2512.11, "total_tokens": 2545152} +{"current_steps": 4385, "total_steps": 134280, "loss": 0.7809, "lr": 1.632409889782544e-05, "epoch": 0.6531128984212095, "percentage": 3.27, "elapsed_time": "0:16:54", "remaining_time": "8:20:46", "throughput": 2512.11, "total_tokens": 2548032} +{"current_steps": 4390, "total_steps": 134280, "loss": 0.6854, "lr": 1.6342716711349422e-05, "epoch": 0.6538576109621687, "percentage": 3.27, "elapsed_time": "0:16:55", "remaining_time": "8:20:45", "throughput": 2512.09, "total_tokens": 2550976} +{"current_steps": 4395, "total_steps": 134280, "loss": 0.6981, "lr": 1.63613345248734e-05, "epoch": 0.6546023235031277, "percentage": 3.27, "elapsed_time": "0:16:56", "remaining_time": "8:20:48", "throughput": 2512.2, "total_tokens": 2554336} +{"current_steps": 4400, "total_steps": 134280, "loss": 0.7461, "lr": 1.637995233839738e-05, "epoch": 0.655347036044087, "percentage": 3.28, "elapsed_time": "0:16:58", "remaining_time": "8:20:49", "throughput": 2512.26, "total_tokens": 2557504} +{"current_steps": 4405, "total_steps": 134280, "loss": 0.6743, "lr": 1.6398570151921357e-05, "epoch": 0.6560917485850462, "percentage": 3.28, "elapsed_time": "0:16:59", "remaining_time": "8:20:47", "throughput": 2512.23, "total_tokens": 2560288} +{"current_steps": 4410, "total_steps": 134280, "loss": 0.6685, "lr": 1.6417187965445338e-05, "epoch": 0.6568364611260054, "percentage": 3.28, "elapsed_time": "0:17:00", "remaining_time": "8:20:45", "throughput": 2512.25, "total_tokens": 2563136} +{"current_steps": 4415, "total_steps": 134280, "loss": 0.5547, "lr": 1.643580577896932e-05, "epoch": 0.6575811736669646, "percentage": 3.29, "elapsed_time": "0:17:01", "remaining_time": "8:20:45", "throughput": 2512.25, "total_tokens": 2566144} +{"current_steps": 4420, "total_steps": 134280, "loss": 0.5959, "lr": 1.6454423592493298e-05, "epoch": 0.6583258862079238, "percentage": 3.29, "elapsed_time": "0:17:02", "remaining_time": "8:20:42", "throughput": 2512.16, "total_tokens": 2568800} +{"current_steps": 4425, "total_steps": 134280, "loss": 0.7216, "lr": 1.647304140601728e-05, "epoch": 0.659070598748883, "percentage": 3.3, "elapsed_time": "0:17:03", "remaining_time": "8:20:41", "throughput": 2512.24, "total_tokens": 2571840} +{"current_steps": 4430, "total_steps": 134280, "loss": 0.6654, "lr": 1.6491659219541258e-05, "epoch": 0.6598153112898422, "percentage": 3.3, "elapsed_time": "0:17:04", "remaining_time": "8:20:40", "throughput": 2512.19, "total_tokens": 2574688} +{"current_steps": 4435, "total_steps": 134280, "loss": 0.6754, "lr": 1.651027703306524e-05, "epoch": 0.6605600238308013, "percentage": 3.3, "elapsed_time": "0:17:05", "remaining_time": "8:20:37", "throughput": 2512.16, "total_tokens": 2577376} +{"current_steps": 4440, "total_steps": 134280, "loss": 0.7805, "lr": 1.6528894846589218e-05, "epoch": 0.6613047363717605, "percentage": 3.31, "elapsed_time": "0:17:07", "remaining_time": "8:20:37", "throughput": 2512.24, "total_tokens": 2580448} +{"current_steps": 4445, "total_steps": 134280, "loss": 0.6887, "lr": 1.6547512660113196e-05, "epoch": 0.6620494489127197, "percentage": 3.31, "elapsed_time": "0:17:08", "remaining_time": "8:20:34", "throughput": 2512.15, "total_tokens": 2583168} +{"current_steps": 4450, "total_steps": 134280, "loss": 0.65, "lr": 1.6566130473637174e-05, "epoch": 0.6627941614536789, "percentage": 3.31, "elapsed_time": "0:17:09", "remaining_time": "8:20:33", "throughput": 2512.12, "total_tokens": 2585984} +{"current_steps": 4455, "total_steps": 134280, "loss": 0.9295, "lr": 1.6584748287161156e-05, "epoch": 0.6635388739946381, "percentage": 3.32, "elapsed_time": "0:17:10", "remaining_time": "8:20:32", "throughput": 2512.13, "total_tokens": 2588928} +{"current_steps": 4460, "total_steps": 134280, "loss": 0.6916, "lr": 1.6603366100685137e-05, "epoch": 0.6642835865355973, "percentage": 3.32, "elapsed_time": "0:17:11", "remaining_time": "8:20:29", "throughput": 2512.05, "total_tokens": 2591584} +{"current_steps": 4465, "total_steps": 134280, "loss": 0.7145, "lr": 1.6621983914209116e-05, "epoch": 0.6650282990765565, "percentage": 3.33, "elapsed_time": "0:17:12", "remaining_time": "8:20:28", "throughput": 2512.04, "total_tokens": 2594496} +{"current_steps": 4470, "total_steps": 134280, "loss": 0.7004, "lr": 1.6640601727733097e-05, "epoch": 0.6657730116175157, "percentage": 3.33, "elapsed_time": "0:17:13", "remaining_time": "8:20:26", "throughput": 2512.07, "total_tokens": 2597408} +{"current_steps": 4475, "total_steps": 134280, "loss": 0.546, "lr": 1.6659219541257075e-05, "epoch": 0.6665177241584749, "percentage": 3.33, "elapsed_time": "0:17:15", "remaining_time": "8:20:25", "throughput": 2512.1, "total_tokens": 2600320} +{"current_steps": 4480, "total_steps": 134280, "loss": 0.5762, "lr": 1.6677837354781057e-05, "epoch": 0.667262436699434, "percentage": 3.34, "elapsed_time": "0:17:16", "remaining_time": "8:20:22", "throughput": 2512.07, "total_tokens": 2603072} +{"current_steps": 4485, "total_steps": 134280, "loss": 0.9108, "lr": 1.6696455168305035e-05, "epoch": 0.6680071492403932, "percentage": 3.34, "elapsed_time": "0:17:17", "remaining_time": "8:20:19", "throughput": 2511.99, "total_tokens": 2605728} +{"current_steps": 4490, "total_steps": 134280, "loss": 0.5766, "lr": 1.6715072981829014e-05, "epoch": 0.6687518617813524, "percentage": 3.34, "elapsed_time": "0:17:18", "remaining_time": "8:20:16", "throughput": 2511.86, "total_tokens": 2608320} +{"current_steps": 4495, "total_steps": 134280, "loss": 0.6795, "lr": 1.6733690795352995e-05, "epoch": 0.6694965743223116, "percentage": 3.35, "elapsed_time": "0:17:19", "remaining_time": "8:20:14", "throughput": 2511.9, "total_tokens": 2611168} +{"current_steps": 4500, "total_steps": 134280, "loss": 0.6201, "lr": 1.6752308608876973e-05, "epoch": 0.6702412868632708, "percentage": 3.35, "elapsed_time": "0:17:20", "remaining_time": "8:20:13", "throughput": 2511.85, "total_tokens": 2614016} +{"current_steps": 4505, "total_steps": 134280, "loss": 0.6952, "lr": 1.6770926422400955e-05, "epoch": 0.67098599940423, "percentage": 3.35, "elapsed_time": "0:17:21", "remaining_time": "8:20:11", "throughput": 2511.83, "total_tokens": 2616864} +{"current_steps": 4510, "total_steps": 134280, "loss": 0.8006, "lr": 1.6789544235924933e-05, "epoch": 0.6717307119451892, "percentage": 3.36, "elapsed_time": "0:17:22", "remaining_time": "8:20:10", "throughput": 2511.81, "total_tokens": 2619808} +{"current_steps": 4515, "total_steps": 134280, "loss": 0.6527, "lr": 1.6808162049448915e-05, "epoch": 0.6724754244861484, "percentage": 3.36, "elapsed_time": "0:17:24", "remaining_time": "8:20:07", "throughput": 2511.77, "total_tokens": 2622464} +{"current_steps": 4520, "total_steps": 134280, "loss": 0.6563, "lr": 1.6826779862972893e-05, "epoch": 0.6732201370271076, "percentage": 3.37, "elapsed_time": "0:17:25", "remaining_time": "8:20:05", "throughput": 2511.71, "total_tokens": 2625216} +{"current_steps": 4525, "total_steps": 134280, "loss": 0.6822, "lr": 1.6845397676496875e-05, "epoch": 0.6739648495680667, "percentage": 3.37, "elapsed_time": "0:17:26", "remaining_time": "8:20:03", "throughput": 2511.7, "total_tokens": 2628096} +{"current_steps": 4530, "total_steps": 134280, "loss": 0.7743, "lr": 1.6864015490020853e-05, "epoch": 0.6747095621090259, "percentage": 3.37, "elapsed_time": "0:17:27", "remaining_time": "8:20:03", "throughput": 2511.7, "total_tokens": 2631072} +{"current_steps": 4535, "total_steps": 134280, "loss": 0.6206, "lr": 1.688263330354483e-05, "epoch": 0.6754542746499851, "percentage": 3.38, "elapsed_time": "0:17:28", "remaining_time": "8:20:02", "throughput": 2511.71, "total_tokens": 2634016} +{"current_steps": 4540, "total_steps": 134280, "loss": 0.6163, "lr": 1.6901251117068813e-05, "epoch": 0.6761989871909443, "percentage": 3.38, "elapsed_time": "0:17:29", "remaining_time": "8:20:05", "throughput": 2511.85, "total_tokens": 2637376} +{"current_steps": 4545, "total_steps": 134280, "loss": 0.6561, "lr": 1.691986893059279e-05, "epoch": 0.6769436997319035, "percentage": 3.38, "elapsed_time": "0:17:31", "remaining_time": "8:20:03", "throughput": 2511.83, "total_tokens": 2640192} +{"current_steps": 4550, "total_steps": 134280, "loss": 0.7016, "lr": 1.6938486744116773e-05, "epoch": 0.6776884122728627, "percentage": 3.39, "elapsed_time": "0:17:32", "remaining_time": "8:20:00", "throughput": 2511.87, "total_tokens": 2643040} +{"current_steps": 4555, "total_steps": 134280, "loss": 0.5584, "lr": 1.695710455764075e-05, "epoch": 0.6784331248138219, "percentage": 3.39, "elapsed_time": "0:17:33", "remaining_time": "8:19:59", "throughput": 2511.85, "total_tokens": 2645856} +{"current_steps": 4560, "total_steps": 134280, "loss": 0.8073, "lr": 1.6975722371164733e-05, "epoch": 0.6791778373547811, "percentage": 3.4, "elapsed_time": "0:17:34", "remaining_time": "8:19:58", "throughput": 2511.93, "total_tokens": 2648928} +{"current_steps": 4565, "total_steps": 134280, "loss": 0.6493, "lr": 1.699434018468871e-05, "epoch": 0.6799225498957402, "percentage": 3.4, "elapsed_time": "0:17:35", "remaining_time": "8:19:56", "throughput": 2511.85, "total_tokens": 2651648} +{"current_steps": 4570, "total_steps": 134280, "loss": 0.6037, "lr": 1.7012957998212692e-05, "epoch": 0.6806672624366994, "percentage": 3.4, "elapsed_time": "0:17:36", "remaining_time": "8:19:55", "throughput": 2511.84, "total_tokens": 2654528} +{"current_steps": 4575, "total_steps": 134280, "loss": 0.6446, "lr": 1.703157581173667e-05, "epoch": 0.6814119749776586, "percentage": 3.41, "elapsed_time": "0:17:37", "remaining_time": "8:19:54", "throughput": 2511.79, "total_tokens": 2657376} +{"current_steps": 4580, "total_steps": 134280, "loss": 0.7246, "lr": 1.705019362526065e-05, "epoch": 0.6821566875186178, "percentage": 3.41, "elapsed_time": "0:17:39", "remaining_time": "8:19:51", "throughput": 2511.75, "total_tokens": 2660160} +{"current_steps": 4585, "total_steps": 134280, "loss": 0.623, "lr": 1.706881143878463e-05, "epoch": 0.682901400059577, "percentage": 3.41, "elapsed_time": "0:17:40", "remaining_time": "8:19:54", "throughput": 2511.84, "total_tokens": 2663520} +{"current_steps": 4590, "total_steps": 134280, "loss": 0.635, "lr": 1.708742925230861e-05, "epoch": 0.6836461126005362, "percentage": 3.42, "elapsed_time": "0:17:41", "remaining_time": "8:19:52", "throughput": 2511.82, "total_tokens": 2666272} +{"current_steps": 4595, "total_steps": 134280, "loss": 0.6925, "lr": 1.710604706583259e-05, "epoch": 0.6843908251414954, "percentage": 3.42, "elapsed_time": "0:17:42", "remaining_time": "8:19:51", "throughput": 2511.86, "total_tokens": 2669248} +{"current_steps": 4600, "total_steps": 134280, "loss": 0.4973, "lr": 1.712466487935657e-05, "epoch": 0.6851355376824546, "percentage": 3.43, "elapsed_time": "0:17:43", "remaining_time": "8:19:50", "throughput": 2511.79, "total_tokens": 2672064} +{"current_steps": 4605, "total_steps": 134280, "loss": 0.7138, "lr": 1.714328269288055e-05, "epoch": 0.6858802502234138, "percentage": 3.43, "elapsed_time": "0:17:44", "remaining_time": "8:19:49", "throughput": 2511.76, "total_tokens": 2675008} +{"current_steps": 4610, "total_steps": 134280, "loss": 0.6883, "lr": 1.716190050640453e-05, "epoch": 0.6866249627643729, "percentage": 3.43, "elapsed_time": "0:17:46", "remaining_time": "8:19:49", "throughput": 2511.82, "total_tokens": 2678080} +{"current_steps": 4615, "total_steps": 134280, "loss": 0.7876, "lr": 1.718051831992851e-05, "epoch": 0.6873696753053321, "percentage": 3.44, "elapsed_time": "0:17:47", "remaining_time": "8:19:48", "throughput": 2511.83, "total_tokens": 2680960} +{"current_steps": 4620, "total_steps": 134280, "loss": 0.679, "lr": 1.7199136133452488e-05, "epoch": 0.6881143878462913, "percentage": 3.44, "elapsed_time": "0:17:48", "remaining_time": "8:19:47", "throughput": 2511.84, "total_tokens": 2683904} +{"current_steps": 4625, "total_steps": 134280, "loss": 0.6107, "lr": 1.7217753946976467e-05, "epoch": 0.6888591003872505, "percentage": 3.44, "elapsed_time": "0:17:49", "remaining_time": "8:19:46", "throughput": 2511.88, "total_tokens": 2686880} +{"current_steps": 4630, "total_steps": 134280, "loss": 0.65, "lr": 1.7236371760500448e-05, "epoch": 0.6896038129282097, "percentage": 3.45, "elapsed_time": "0:17:50", "remaining_time": "8:19:43", "throughput": 2511.83, "total_tokens": 2689536} +{"current_steps": 4635, "total_steps": 134280, "loss": 0.6951, "lr": 1.7254989574024426e-05, "epoch": 0.6903485254691689, "percentage": 3.45, "elapsed_time": "0:17:51", "remaining_time": "8:19:41", "throughput": 2511.82, "total_tokens": 2692384} +{"current_steps": 4640, "total_steps": 134280, "loss": 0.8068, "lr": 1.7273607387548408e-05, "epoch": 0.6910932380101281, "percentage": 3.46, "elapsed_time": "0:17:53", "remaining_time": "8:19:42", "throughput": 2511.81, "total_tokens": 2695424} +{"current_steps": 4645, "total_steps": 134280, "loss": 0.747, "lr": 1.7292225201072386e-05, "epoch": 0.6918379505510873, "percentage": 3.46, "elapsed_time": "0:17:54", "remaining_time": "8:19:41", "throughput": 2511.86, "total_tokens": 2698464} +{"current_steps": 4650, "total_steps": 134280, "loss": 0.5177, "lr": 1.7310843014596368e-05, "epoch": 0.6925826630920465, "percentage": 3.46, "elapsed_time": "0:17:55", "remaining_time": "8:19:38", "throughput": 2511.86, "total_tokens": 2701184} +{"current_steps": 4655, "total_steps": 134280, "loss": 0.6433, "lr": 1.7329460828120346e-05, "epoch": 0.6933273756330056, "percentage": 3.47, "elapsed_time": "0:17:56", "remaining_time": "8:19:37", "throughput": 2511.89, "total_tokens": 2704160} +{"current_steps": 4660, "total_steps": 134280, "loss": 0.575, "lr": 1.7348078641644328e-05, "epoch": 0.6940720881739648, "percentage": 3.47, "elapsed_time": "0:17:57", "remaining_time": "8:19:35", "throughput": 2511.9, "total_tokens": 2706944} +{"current_steps": 4665, "total_steps": 134280, "loss": 0.7345, "lr": 1.7366696455168306e-05, "epoch": 0.694816800714924, "percentage": 3.47, "elapsed_time": "0:17:58", "remaining_time": "8:19:34", "throughput": 2511.87, "total_tokens": 2709824} +{"current_steps": 4670, "total_steps": 134280, "loss": 0.8231, "lr": 1.7385314268692284e-05, "epoch": 0.6955615132558832, "percentage": 3.48, "elapsed_time": "0:17:59", "remaining_time": "8:19:30", "throughput": 2511.8, "total_tokens": 2712448} +{"current_steps": 4675, "total_steps": 134280, "loss": 0.6853, "lr": 1.7403932082216266e-05, "epoch": 0.6963062257968424, "percentage": 3.48, "elapsed_time": "0:18:01", "remaining_time": "8:19:29", "throughput": 2511.87, "total_tokens": 2715456} +{"current_steps": 4680, "total_steps": 134280, "loss": 0.6136, "lr": 1.7422549895740244e-05, "epoch": 0.6970509383378016, "percentage": 3.49, "elapsed_time": "0:18:02", "remaining_time": "8:19:26", "throughput": 2511.8, "total_tokens": 2718080} +{"current_steps": 4685, "total_steps": 134280, "loss": 0.6125, "lr": 1.7441167709264226e-05, "epoch": 0.6977956508787608, "percentage": 3.49, "elapsed_time": "0:18:03", "remaining_time": "8:19:24", "throughput": 2511.81, "total_tokens": 2720928} +{"current_steps": 4690, "total_steps": 134280, "loss": 0.6998, "lr": 1.7459785522788204e-05, "epoch": 0.69854036341972, "percentage": 3.49, "elapsed_time": "0:18:04", "remaining_time": "8:19:25", "throughput": 2511.87, "total_tokens": 2724096} +{"current_steps": 4695, "total_steps": 134280, "loss": 0.6168, "lr": 1.7478403336312185e-05, "epoch": 0.6992850759606791, "percentage": 3.5, "elapsed_time": "0:18:05", "remaining_time": "8:19:26", "throughput": 2511.95, "total_tokens": 2727264} +{"current_steps": 4700, "total_steps": 134280, "loss": 0.5299, "lr": 1.7497021149836164e-05, "epoch": 0.7000297885016383, "percentage": 3.5, "elapsed_time": "0:18:06", "remaining_time": "8:19:22", "throughput": 2511.81, "total_tokens": 2729760} +{"current_steps": 4705, "total_steps": 134280, "loss": 0.7093, "lr": 1.7515638963360142e-05, "epoch": 0.7007745010425975, "percentage": 3.5, "elapsed_time": "0:18:07", "remaining_time": "8:19:19", "throughput": 2511.76, "total_tokens": 2732416} +{"current_steps": 4710, "total_steps": 134280, "loss": 0.7076, "lr": 1.7534256776884124e-05, "epoch": 0.7015192135835567, "percentage": 3.51, "elapsed_time": "0:18:08", "remaining_time": "8:19:16", "throughput": 2511.66, "total_tokens": 2735072} +{"current_steps": 4715, "total_steps": 134280, "loss": 0.8008, "lr": 1.7552874590408102e-05, "epoch": 0.7022639261245159, "percentage": 3.51, "elapsed_time": "0:18:10", "remaining_time": "8:19:14", "throughput": 2511.6, "total_tokens": 2737792} +{"current_steps": 4720, "total_steps": 134280, "loss": 0.9158, "lr": 1.7571492403932083e-05, "epoch": 0.7030086386654751, "percentage": 3.52, "elapsed_time": "0:18:11", "remaining_time": "8:19:12", "throughput": 2511.63, "total_tokens": 2740704} +{"current_steps": 4725, "total_steps": 134280, "loss": 0.6513, "lr": 1.759011021745606e-05, "epoch": 0.7037533512064343, "percentage": 3.52, "elapsed_time": "0:18:12", "remaining_time": "8:19:10", "throughput": 2511.62, "total_tokens": 2743520} +{"current_steps": 4730, "total_steps": 134280, "loss": 0.5285, "lr": 1.7608728030980043e-05, "epoch": 0.7044980637473935, "percentage": 3.52, "elapsed_time": "0:18:13", "remaining_time": "8:19:08", "throughput": 2511.63, "total_tokens": 2746368} +{"current_steps": 4735, "total_steps": 134280, "loss": 0.607, "lr": 1.762734584450402e-05, "epoch": 0.7052427762883527, "percentage": 3.53, "elapsed_time": "0:18:14", "remaining_time": "8:19:07", "throughput": 2511.59, "total_tokens": 2749184} +{"current_steps": 4740, "total_steps": 134280, "loss": 0.7292, "lr": 1.7645963658028003e-05, "epoch": 0.7059874888293118, "percentage": 3.53, "elapsed_time": "0:18:15", "remaining_time": "8:19:05", "throughput": 2511.52, "total_tokens": 2752000} +{"current_steps": 4745, "total_steps": 134280, "loss": 0.7292, "lr": 1.7664581471551985e-05, "epoch": 0.706732201370271, "percentage": 3.53, "elapsed_time": "0:18:16", "remaining_time": "8:19:03", "throughput": 2511.46, "total_tokens": 2754688} +{"current_steps": 4750, "total_steps": 134280, "loss": 0.8051, "lr": 1.768319928507596e-05, "epoch": 0.7074769139112302, "percentage": 3.54, "elapsed_time": "0:18:17", "remaining_time": "8:19:01", "throughput": 2511.43, "total_tokens": 2757472} +{"current_steps": 4755, "total_steps": 134280, "loss": 0.5923, "lr": 1.770181709859994e-05, "epoch": 0.7082216264521894, "percentage": 3.54, "elapsed_time": "0:18:19", "remaining_time": "8:18:58", "throughput": 2511.45, "total_tokens": 2760288} +{"current_steps": 4760, "total_steps": 134280, "loss": 0.6924, "lr": 1.772043491212392e-05, "epoch": 0.7089663389931486, "percentage": 3.54, "elapsed_time": "0:18:20", "remaining_time": "8:18:55", "throughput": 2511.47, "total_tokens": 2763040} +{"current_steps": 4765, "total_steps": 134280, "loss": 0.8044, "lr": 1.77390527256479e-05, "epoch": 0.7097110515341079, "percentage": 3.55, "elapsed_time": "0:18:21", "remaining_time": "8:18:56", "throughput": 2511.51, "total_tokens": 2766176} +{"current_steps": 4770, "total_steps": 134280, "loss": 0.7327, "lr": 1.775767053917188e-05, "epoch": 0.710455764075067, "percentage": 3.55, "elapsed_time": "0:18:22", "remaining_time": "8:18:57", "throughput": 2511.62, "total_tokens": 2769408} +{"current_steps": 4775, "total_steps": 134280, "loss": 0.7246, "lr": 1.777628835269586e-05, "epoch": 0.7112004766160263, "percentage": 3.56, "elapsed_time": "0:18:23", "remaining_time": "8:18:56", "throughput": 2511.6, "total_tokens": 2772256} +{"current_steps": 4780, "total_steps": 134280, "loss": 0.7145, "lr": 1.779490616621984e-05, "epoch": 0.7119451891569855, "percentage": 3.56, "elapsed_time": "0:18:24", "remaining_time": "8:18:52", "throughput": 2511.55, "total_tokens": 2774912} +{"current_steps": 4785, "total_steps": 134280, "loss": 0.6419, "lr": 1.781352397974382e-05, "epoch": 0.7126899016979446, "percentage": 3.56, "elapsed_time": "0:18:25", "remaining_time": "8:18:50", "throughput": 2511.49, "total_tokens": 2777600} +{"current_steps": 4790, "total_steps": 134280, "loss": 0.5734, "lr": 1.78321417932678e-05, "epoch": 0.7134346142389038, "percentage": 3.57, "elapsed_time": "0:18:27", "remaining_time": "8:18:48", "throughput": 2511.48, "total_tokens": 2780480} +{"current_steps": 4795, "total_steps": 134280, "loss": 0.7599, "lr": 1.7850759606791777e-05, "epoch": 0.714179326779863, "percentage": 3.57, "elapsed_time": "0:18:28", "remaining_time": "8:18:50", "throughput": 2511.52, "total_tokens": 2783648} +{"current_steps": 4800, "total_steps": 134280, "loss": 0.5888, "lr": 1.786937742031576e-05, "epoch": 0.7149240393208222, "percentage": 3.57, "elapsed_time": "0:18:29", "remaining_time": "8:18:51", "throughput": 2511.63, "total_tokens": 2786880} +{"current_steps": 4805, "total_steps": 134280, "loss": 0.6619, "lr": 1.7887995233839737e-05, "epoch": 0.7156687518617814, "percentage": 3.58, "elapsed_time": "0:18:30", "remaining_time": "8:18:47", "throughput": 2511.55, "total_tokens": 2789440} +{"current_steps": 4810, "total_steps": 134280, "loss": 0.6101, "lr": 1.790661304736372e-05, "epoch": 0.7164134644027406, "percentage": 3.58, "elapsed_time": "0:18:31", "remaining_time": "8:18:48", "throughput": 2511.65, "total_tokens": 2792640} +{"current_steps": 4815, "total_steps": 134280, "loss": 0.5928, "lr": 1.7925230860887697e-05, "epoch": 0.7171581769436998, "percentage": 3.59, "elapsed_time": "0:18:33", "remaining_time": "8:18:47", "throughput": 2511.68, "total_tokens": 2795616} +{"current_steps": 4820, "total_steps": 134280, "loss": 0.6766, "lr": 1.794384867441168e-05, "epoch": 0.717902889484659, "percentage": 3.59, "elapsed_time": "0:18:34", "remaining_time": "8:18:47", "throughput": 2511.78, "total_tokens": 2798752} +{"current_steps": 4825, "total_steps": 134280, "loss": 0.7338, "lr": 1.796246648793566e-05, "epoch": 0.7186476020256181, "percentage": 3.59, "elapsed_time": "0:18:35", "remaining_time": "8:18:44", "throughput": 2511.65, "total_tokens": 2801344} +{"current_steps": 4830, "total_steps": 134280, "loss": 0.7075, "lr": 1.798108430145964e-05, "epoch": 0.7193923145665773, "percentage": 3.6, "elapsed_time": "0:18:36", "remaining_time": "8:18:45", "throughput": 2511.64, "total_tokens": 2804384} +{"current_steps": 4835, "total_steps": 134280, "loss": 0.7292, "lr": 1.7999702114983617e-05, "epoch": 0.7201370271075365, "percentage": 3.6, "elapsed_time": "0:18:37", "remaining_time": "8:18:45", "throughput": 2511.65, "total_tokens": 2807456} +{"current_steps": 4840, "total_steps": 134280, "loss": 0.7071, "lr": 1.8018319928507595e-05, "epoch": 0.7208817396484957, "percentage": 3.6, "elapsed_time": "0:18:38", "remaining_time": "8:18:44", "throughput": 2511.66, "total_tokens": 2810400} +{"current_steps": 4845, "total_steps": 134280, "loss": 0.6244, "lr": 1.8036937742031576e-05, "epoch": 0.7216264521894549, "percentage": 3.61, "elapsed_time": "0:18:40", "remaining_time": "8:18:44", "throughput": 2511.71, "total_tokens": 2813408} +{"current_steps": 4850, "total_steps": 134280, "loss": 0.686, "lr": 1.8055555555555555e-05, "epoch": 0.7223711647304141, "percentage": 3.61, "elapsed_time": "0:18:41", "remaining_time": "8:18:43", "throughput": 2511.72, "total_tokens": 2816384} +{"current_steps": 4855, "total_steps": 134280, "loss": 0.8599, "lr": 1.8074173369079536e-05, "epoch": 0.7231158772713733, "percentage": 3.62, "elapsed_time": "0:18:42", "remaining_time": "8:18:43", "throughput": 2511.83, "total_tokens": 2819552} +{"current_steps": 4860, "total_steps": 134280, "loss": 0.5375, "lr": 1.8092791182603515e-05, "epoch": 0.7238605898123325, "percentage": 3.62, "elapsed_time": "0:18:43", "remaining_time": "8:18:42", "throughput": 2511.88, "total_tokens": 2822496} +{"current_steps": 4865, "total_steps": 134280, "loss": 0.7388, "lr": 1.8111408996127496e-05, "epoch": 0.7246053023532917, "percentage": 3.62, "elapsed_time": "0:18:44", "remaining_time": "8:18:41", "throughput": 2511.92, "total_tokens": 2825472} +{"current_steps": 4870, "total_steps": 134280, "loss": 0.5519, "lr": 1.8130026809651478e-05, "epoch": 0.7253500148942508, "percentage": 3.63, "elapsed_time": "0:18:45", "remaining_time": "8:18:39", "throughput": 2511.93, "total_tokens": 2828288} +{"current_steps": 4875, "total_steps": 134280, "loss": 0.7225, "lr": 1.8148644623175456e-05, "epoch": 0.72609472743521, "percentage": 3.63, "elapsed_time": "0:18:47", "remaining_time": "8:18:38", "throughput": 2511.97, "total_tokens": 2831232} +{"current_steps": 4880, "total_steps": 134280, "loss": 0.6105, "lr": 1.8167262436699434e-05, "epoch": 0.7268394399761692, "percentage": 3.63, "elapsed_time": "0:18:48", "remaining_time": "8:18:37", "throughput": 2512.0, "total_tokens": 2834208} +{"current_steps": 4885, "total_steps": 134280, "loss": 0.8269, "lr": 1.8185880250223413e-05, "epoch": 0.7275841525171284, "percentage": 3.64, "elapsed_time": "0:18:49", "remaining_time": "8:18:34", "throughput": 2511.93, "total_tokens": 2836832} +{"current_steps": 4890, "total_steps": 134280, "loss": 0.6729, "lr": 1.8204498063747394e-05, "epoch": 0.7283288650580876, "percentage": 3.64, "elapsed_time": "0:18:50", "remaining_time": "8:18:34", "throughput": 2511.42, "total_tokens": 2839296} +{"current_steps": 4895, "total_steps": 134280, "loss": 0.6464, "lr": 1.8223115877271372e-05, "epoch": 0.7290735775990468, "percentage": 3.65, "elapsed_time": "0:18:51", "remaining_time": "8:18:32", "throughput": 2511.34, "total_tokens": 2842048} +{"current_steps": 4900, "total_steps": 134280, "loss": 0.9101, "lr": 1.8241733690795354e-05, "epoch": 0.729818290140006, "percentage": 3.65, "elapsed_time": "0:18:52", "remaining_time": "8:18:30", "throughput": 2511.35, "total_tokens": 2844896} +{"current_steps": 4905, "total_steps": 134280, "loss": 0.5779, "lr": 1.8260351504319336e-05, "epoch": 0.7305630026809652, "percentage": 3.65, "elapsed_time": "0:18:53", "remaining_time": "8:18:27", "throughput": 2511.3, "total_tokens": 2847552} +{"current_steps": 4910, "total_steps": 134280, "loss": 0.5577, "lr": 1.8278969317843314e-05, "epoch": 0.7313077152219244, "percentage": 3.66, "elapsed_time": "0:18:55", "remaining_time": "8:18:25", "throughput": 2511.31, "total_tokens": 2850368} +{"current_steps": 4915, "total_steps": 134280, "loss": 0.6631, "lr": 1.8297587131367295e-05, "epoch": 0.7320524277628835, "percentage": 3.66, "elapsed_time": "0:18:56", "remaining_time": "8:18:25", "throughput": 2511.26, "total_tokens": 2853344} +{"current_steps": 4920, "total_steps": 134280, "loss": 0.7043, "lr": 1.831620494489127e-05, "epoch": 0.7327971403038427, "percentage": 3.66, "elapsed_time": "0:18:57", "remaining_time": "8:18:25", "throughput": 2511.32, "total_tokens": 2856416} +{"current_steps": 4925, "total_steps": 134280, "loss": 0.6535, "lr": 1.8334822758415252e-05, "epoch": 0.7335418528448019, "percentage": 3.67, "elapsed_time": "0:18:58", "remaining_time": "8:18:25", "throughput": 2511.31, "total_tokens": 2859360} +{"current_steps": 4930, "total_steps": 134280, "loss": 0.6756, "lr": 1.835344057193923e-05, "epoch": 0.7342865653857611, "percentage": 3.67, "elapsed_time": "0:18:59", "remaining_time": "8:18:24", "throughput": 2511.4, "total_tokens": 2862368} +{"current_steps": 4935, "total_steps": 134280, "loss": 0.6647, "lr": 1.8372058385463212e-05, "epoch": 0.7350312779267203, "percentage": 3.68, "elapsed_time": "0:19:00", "remaining_time": "8:18:21", "throughput": 2511.38, "total_tokens": 2865120} +{"current_steps": 4940, "total_steps": 134280, "loss": 0.7099, "lr": 1.8390676198987193e-05, "epoch": 0.7357759904676795, "percentage": 3.68, "elapsed_time": "0:19:02", "remaining_time": "8:18:21", "throughput": 2511.43, "total_tokens": 2868224} +{"current_steps": 4945, "total_steps": 134280, "loss": 0.6059, "lr": 1.840929401251117e-05, "epoch": 0.7365207030086387, "percentage": 3.68, "elapsed_time": "0:19:03", "remaining_time": "8:18:22", "throughput": 2511.48, "total_tokens": 2871360} +{"current_steps": 4950, "total_steps": 134280, "loss": 0.5068, "lr": 1.8427911826035153e-05, "epoch": 0.7372654155495979, "percentage": 3.69, "elapsed_time": "0:19:04", "remaining_time": "8:18:23", "throughput": 2511.52, "total_tokens": 2874496} +{"current_steps": 4955, "total_steps": 134280, "loss": 0.7657, "lr": 1.844652963955913e-05, "epoch": 0.738010128090557, "percentage": 3.69, "elapsed_time": "0:19:05", "remaining_time": "8:18:20", "throughput": 2511.5, "total_tokens": 2877248} +{"current_steps": 4960, "total_steps": 134280, "loss": 0.6832, "lr": 1.8465147453083113e-05, "epoch": 0.7387548406315162, "percentage": 3.69, "elapsed_time": "0:19:06", "remaining_time": "8:18:19", "throughput": 2511.51, "total_tokens": 2880128} +{"current_steps": 4965, "total_steps": 134280, "loss": 0.4799, "lr": 1.8483765266607088e-05, "epoch": 0.7394995531724754, "percentage": 3.7, "elapsed_time": "0:19:07", "remaining_time": "8:18:17", "throughput": 2511.45, "total_tokens": 2882944} +{"current_steps": 4970, "total_steps": 134280, "loss": 0.706, "lr": 1.850238308013107e-05, "epoch": 0.7402442657134346, "percentage": 3.7, "elapsed_time": "0:19:09", "remaining_time": "8:18:16", "throughput": 2511.49, "total_tokens": 2885856} +{"current_steps": 4975, "total_steps": 134280, "loss": 0.852, "lr": 1.8521000893655048e-05, "epoch": 0.7409889782543938, "percentage": 3.7, "elapsed_time": "0:19:10", "remaining_time": "8:18:15", "throughput": 2511.48, "total_tokens": 2888768} +{"current_steps": 4980, "total_steps": 134280, "loss": 0.5451, "lr": 1.853961870717903e-05, "epoch": 0.741733690795353, "percentage": 3.71, "elapsed_time": "0:19:11", "remaining_time": "8:18:14", "throughput": 2511.46, "total_tokens": 2891648} +{"current_steps": 4985, "total_steps": 134280, "loss": 0.7736, "lr": 1.855823652070301e-05, "epoch": 0.7424784033363122, "percentage": 3.71, "elapsed_time": "0:19:12", "remaining_time": "8:18:12", "throughput": 2511.45, "total_tokens": 2894464} +{"current_steps": 4990, "total_steps": 134280, "loss": 0.5074, "lr": 1.857685433422699e-05, "epoch": 0.7432231158772714, "percentage": 3.72, "elapsed_time": "0:19:13", "remaining_time": "8:18:09", "throughput": 2511.38, "total_tokens": 2897088} +{"current_steps": 4995, "total_steps": 134280, "loss": 0.6493, "lr": 1.859547214775097e-05, "epoch": 0.7439678284182306, "percentage": 3.72, "elapsed_time": "0:19:14", "remaining_time": "8:18:08", "throughput": 2511.39, "total_tokens": 2900032} +{"current_steps": 5000, "total_steps": 134280, "loss": 0.6536, "lr": 1.861408996127495e-05, "epoch": 0.7447125409591897, "percentage": 3.72, "elapsed_time": "0:19:15", "remaining_time": "8:18:07", "throughput": 2511.38, "total_tokens": 2902944} +{"current_steps": 5005, "total_steps": 134280, "loss": 0.4508, "lr": 1.863270777479893e-05, "epoch": 0.7454572535001489, "percentage": 3.73, "elapsed_time": "0:19:17", "remaining_time": "8:18:06", "throughput": 2511.35, "total_tokens": 2905856} +{"current_steps": 5010, "total_steps": 134280, "loss": 0.7012, "lr": 1.8651325588322906e-05, "epoch": 0.7462019660411081, "percentage": 3.73, "elapsed_time": "0:19:18", "remaining_time": "8:18:03", "throughput": 2511.3, "total_tokens": 2908544} +{"current_steps": 5015, "total_steps": 134280, "loss": 0.6275, "lr": 1.8669943401846887e-05, "epoch": 0.7469466785820673, "percentage": 3.73, "elapsed_time": "0:19:19", "remaining_time": "8:18:04", "throughput": 2511.3, "total_tokens": 2911584} +{"current_steps": 5020, "total_steps": 134280, "loss": 0.6551, "lr": 1.868856121537087e-05, "epoch": 0.7476913911230265, "percentage": 3.74, "elapsed_time": "0:19:20", "remaining_time": "8:18:05", "throughput": 2511.28, "total_tokens": 2914752} +{"current_steps": 5025, "total_steps": 134280, "loss": 0.791, "lr": 1.8707179028894847e-05, "epoch": 0.7484361036639857, "percentage": 3.74, "elapsed_time": "0:19:21", "remaining_time": "8:18:03", "throughput": 2511.21, "total_tokens": 2917472} +{"current_steps": 5030, "total_steps": 134280, "loss": 0.8478, "lr": 1.872579684241883e-05, "epoch": 0.7491808162049449, "percentage": 3.75, "elapsed_time": "0:19:22", "remaining_time": "8:18:01", "throughput": 2511.16, "total_tokens": 2920224} +{"current_steps": 5035, "total_steps": 134280, "loss": 0.5543, "lr": 1.8744414655942807e-05, "epoch": 0.7499255287459041, "percentage": 3.75, "elapsed_time": "0:19:24", "remaining_time": "8:18:00", "throughput": 2511.17, "total_tokens": 2923136} +{"current_steps": 5040, "total_steps": 134280, "loss": 0.5964, "lr": 1.876303246946679e-05, "epoch": 0.7506702412868632, "percentage": 3.75, "elapsed_time": "0:19:25", "remaining_time": "8:18:05", "throughput": 2511.32, "total_tokens": 2926816} +{"current_steps": 5045, "total_steps": 134280, "loss": 0.8146, "lr": 1.8781650282990767e-05, "epoch": 0.7514149538278224, "percentage": 3.76, "elapsed_time": "0:19:26", "remaining_time": "8:18:02", "throughput": 2511.29, "total_tokens": 2929504} +{"current_steps": 5050, "total_steps": 134280, "loss": 0.7004, "lr": 1.8800268096514745e-05, "epoch": 0.7521596663687816, "percentage": 3.76, "elapsed_time": "0:19:27", "remaining_time": "8:18:01", "throughput": 2511.3, "total_tokens": 2932448} +{"current_steps": 5055, "total_steps": 134280, "loss": 0.7807, "lr": 1.8818885910038723e-05, "epoch": 0.7529043789097408, "percentage": 3.76, "elapsed_time": "0:19:28", "remaining_time": "8:18:02", "throughput": 2511.39, "total_tokens": 2935648} +{"current_steps": 5060, "total_steps": 134280, "loss": 0.7709, "lr": 1.8837503723562705e-05, "epoch": 0.7536490914507, "percentage": 3.77, "elapsed_time": "0:19:30", "remaining_time": "8:18:00", "throughput": 2511.39, "total_tokens": 2938496} +{"current_steps": 5065, "total_steps": 134280, "loss": 0.6947, "lr": 1.8856121537086686e-05, "epoch": 0.7543938039916592, "percentage": 3.77, "elapsed_time": "0:19:31", "remaining_time": "8:18:00", "throughput": 2511.41, "total_tokens": 2941536} +{"current_steps": 5070, "total_steps": 134280, "loss": 0.6683, "lr": 1.8874739350610665e-05, "epoch": 0.7551385165326184, "percentage": 3.78, "elapsed_time": "0:19:32", "remaining_time": "8:18:02", "throughput": 2511.41, "total_tokens": 2944736} +{"current_steps": 5075, "total_steps": 134280, "loss": 0.6387, "lr": 1.8893357164134646e-05, "epoch": 0.7558832290735776, "percentage": 3.78, "elapsed_time": "0:19:33", "remaining_time": "8:18:00", "throughput": 2511.37, "total_tokens": 2947552} +{"current_steps": 5080, "total_steps": 134280, "loss": 0.673, "lr": 1.8911974977658625e-05, "epoch": 0.7566279416145368, "percentage": 3.78, "elapsed_time": "0:19:34", "remaining_time": "8:18:00", "throughput": 2511.44, "total_tokens": 2950592} +{"current_steps": 5085, "total_steps": 134280, "loss": 0.7629, "lr": 1.8930592791182606e-05, "epoch": 0.7573726541554959, "percentage": 3.79, "elapsed_time": "0:19:35", "remaining_time": "8:17:58", "throughput": 2511.45, "total_tokens": 2953408} +{"current_steps": 5090, "total_steps": 134280, "loss": 0.4689, "lr": 1.8949210604706584e-05, "epoch": 0.7581173666964551, "percentage": 3.79, "elapsed_time": "0:19:37", "remaining_time": "8:17:55", "throughput": 2511.38, "total_tokens": 2956064} +{"current_steps": 5095, "total_steps": 134280, "loss": 0.609, "lr": 1.8967828418230563e-05, "epoch": 0.7588620792374143, "percentage": 3.79, "elapsed_time": "0:19:38", "remaining_time": "8:17:57", "throughput": 2511.45, "total_tokens": 2959392} +{"current_steps": 5100, "total_steps": 134280, "loss": 0.6698, "lr": 1.8986446231754544e-05, "epoch": 0.7596067917783735, "percentage": 3.8, "elapsed_time": "0:19:39", "remaining_time": "8:17:55", "throughput": 2511.45, "total_tokens": 2962240} +{"current_steps": 5105, "total_steps": 134280, "loss": 0.6469, "lr": 1.9005064045278523e-05, "epoch": 0.7603515043193327, "percentage": 3.8, "elapsed_time": "0:19:40", "remaining_time": "8:17:54", "throughput": 2511.49, "total_tokens": 2965152} +{"current_steps": 5110, "total_steps": 134280, "loss": 0.6416, "lr": 1.9023681858802504e-05, "epoch": 0.7610962168602919, "percentage": 3.81, "elapsed_time": "0:19:41", "remaining_time": "8:17:52", "throughput": 2511.52, "total_tokens": 2968064} +{"current_steps": 5115, "total_steps": 134280, "loss": 0.6257, "lr": 1.9042299672326482e-05, "epoch": 0.7618409294012511, "percentage": 3.81, "elapsed_time": "0:19:42", "remaining_time": "8:17:50", "throughput": 2511.43, "total_tokens": 2970752} +{"current_steps": 5120, "total_steps": 134280, "loss": 0.6287, "lr": 1.9060917485850464e-05, "epoch": 0.7625856419422103, "percentage": 3.81, "elapsed_time": "0:19:44", "remaining_time": "8:17:49", "throughput": 2511.46, "total_tokens": 2973664} +{"current_steps": 5125, "total_steps": 134280, "loss": 0.8084, "lr": 1.9079535299374442e-05, "epoch": 0.7633303544831695, "percentage": 3.82, "elapsed_time": "0:19:45", "remaining_time": "8:17:49", "throughput": 2511.47, "total_tokens": 2976704} +{"current_steps": 5130, "total_steps": 134280, "loss": 0.5751, "lr": 1.9098153112898424e-05, "epoch": 0.7640750670241286, "percentage": 3.82, "elapsed_time": "0:19:46", "remaining_time": "8:17:48", "throughput": 2511.52, "total_tokens": 2979680} +{"current_steps": 5135, "total_steps": 134280, "loss": 0.6105, "lr": 1.9116770926422402e-05, "epoch": 0.7648197795650878, "percentage": 3.82, "elapsed_time": "0:19:47", "remaining_time": "8:17:45", "throughput": 2511.52, "total_tokens": 2982464} +{"current_steps": 5140, "total_steps": 134280, "loss": 0.4923, "lr": 1.913538873994638e-05, "epoch": 0.765564492106047, "percentage": 3.83, "elapsed_time": "0:19:48", "remaining_time": "8:17:43", "throughput": 2511.48, "total_tokens": 2985216} +{"current_steps": 5145, "total_steps": 134280, "loss": 0.8103, "lr": 1.9154006553470362e-05, "epoch": 0.7663092046470062, "percentage": 3.83, "elapsed_time": "0:19:49", "remaining_time": "8:17:41", "throughput": 2511.47, "total_tokens": 2988000} +{"current_steps": 5150, "total_steps": 134280, "loss": 0.6222, "lr": 1.917262436699434e-05, "epoch": 0.7670539171879655, "percentage": 3.84, "elapsed_time": "0:19:50", "remaining_time": "8:17:39", "throughput": 2511.42, "total_tokens": 2990752} +{"current_steps": 5155, "total_steps": 134280, "loss": 0.6457, "lr": 1.9191242180518322e-05, "epoch": 0.7677986297289247, "percentage": 3.84, "elapsed_time": "0:19:51", "remaining_time": "8:17:37", "throughput": 2511.47, "total_tokens": 2993664} +{"current_steps": 5160, "total_steps": 134280, "loss": 0.6137, "lr": 1.92098599940423e-05, "epoch": 0.7685433422698839, "percentage": 3.84, "elapsed_time": "0:19:53", "remaining_time": "8:17:35", "throughput": 2511.45, "total_tokens": 2996480} +{"current_steps": 5165, "total_steps": 134280, "loss": 0.8483, "lr": 1.922847780756628e-05, "epoch": 0.7692880548108431, "percentage": 3.85, "elapsed_time": "0:19:54", "remaining_time": "8:17:35", "throughput": 2511.47, "total_tokens": 2999520} +{"current_steps": 5170, "total_steps": 134280, "loss": 0.6878, "lr": 1.924709562109026e-05, "epoch": 0.7700327673518021, "percentage": 3.85, "elapsed_time": "0:19:55", "remaining_time": "8:17:35", "throughput": 2511.47, "total_tokens": 3002496} +{"current_steps": 5175, "total_steps": 134280, "loss": 0.5819, "lr": 1.926571343461424e-05, "epoch": 0.7707774798927614, "percentage": 3.85, "elapsed_time": "0:19:56", "remaining_time": "8:17:33", "throughput": 2511.45, "total_tokens": 3005312} +{"current_steps": 5180, "total_steps": 134280, "loss": 0.6861, "lr": 1.928433124813822e-05, "epoch": 0.7715221924337206, "percentage": 3.86, "elapsed_time": "0:19:57", "remaining_time": "8:17:31", "throughput": 2511.43, "total_tokens": 3008128} +{"current_steps": 5185, "total_steps": 134280, "loss": 0.6601, "lr": 1.9302949061662198e-05, "epoch": 0.7722669049746798, "percentage": 3.86, "elapsed_time": "0:19:58", "remaining_time": "8:17:31", "throughput": 2511.44, "total_tokens": 3011072} +{"current_steps": 5190, "total_steps": 134280, "loss": 0.7444, "lr": 1.932156687518618e-05, "epoch": 0.773011617515639, "percentage": 3.87, "elapsed_time": "0:20:00", "remaining_time": "8:17:31", "throughput": 2511.55, "total_tokens": 3014272} +{"current_steps": 5195, "total_steps": 134280, "loss": 0.5924, "lr": 1.9340184688710158e-05, "epoch": 0.7737563300565982, "percentage": 3.87, "elapsed_time": "0:20:01", "remaining_time": "8:17:30", "throughput": 2511.57, "total_tokens": 3017248} +{"current_steps": 5200, "total_steps": 134280, "loss": 0.6774, "lr": 1.935880250223414e-05, "epoch": 0.7745010425975574, "percentage": 3.87, "elapsed_time": "0:20:02", "remaining_time": "8:17:29", "throughput": 2511.58, "total_tokens": 3020160} +{"current_steps": 5205, "total_steps": 134280, "loss": 0.7079, "lr": 1.9377420315758118e-05, "epoch": 0.7752457551385166, "percentage": 3.88, "elapsed_time": "0:20:03", "remaining_time": "8:17:29", "throughput": 2511.6, "total_tokens": 3023200} +{"current_steps": 5210, "total_steps": 134280, "loss": 0.5338, "lr": 1.93960381292821e-05, "epoch": 0.7759904676794758, "percentage": 3.88, "elapsed_time": "0:20:04", "remaining_time": "8:17:28", "throughput": 2511.67, "total_tokens": 3026240} +{"current_steps": 5215, "total_steps": 134280, "loss": 0.6385, "lr": 1.9414655942806077e-05, "epoch": 0.7767351802204349, "percentage": 3.88, "elapsed_time": "0:20:05", "remaining_time": "8:17:26", "throughput": 2511.61, "total_tokens": 3028928} +{"current_steps": 5220, "total_steps": 134280, "loss": 0.7483, "lr": 1.943327375633006e-05, "epoch": 0.7774798927613941, "percentage": 3.89, "elapsed_time": "0:20:07", "remaining_time": "8:17:25", "throughput": 2511.59, "total_tokens": 3031808} +{"current_steps": 5225, "total_steps": 134280, "loss": 0.75, "lr": 1.9451891569854037e-05, "epoch": 0.7782246053023533, "percentage": 3.89, "elapsed_time": "0:20:08", "remaining_time": "8:17:23", "throughput": 2511.59, "total_tokens": 3034656} +{"current_steps": 5230, "total_steps": 134280, "loss": 0.7225, "lr": 1.9470509383378016e-05, "epoch": 0.7789693178433125, "percentage": 3.89, "elapsed_time": "0:20:09", "remaining_time": "8:17:24", "throughput": 2511.61, "total_tokens": 3037760} +{"current_steps": 5235, "total_steps": 134280, "loss": 0.6584, "lr": 1.9489127196901997e-05, "epoch": 0.7797140303842717, "percentage": 3.9, "elapsed_time": "0:20:10", "remaining_time": "8:17:23", "throughput": 2511.6, "total_tokens": 3040672} +{"current_steps": 5240, "total_steps": 134280, "loss": 0.6752, "lr": 1.9507745010425975e-05, "epoch": 0.7804587429252309, "percentage": 3.9, "elapsed_time": "0:20:11", "remaining_time": "8:17:21", "throughput": 2511.59, "total_tokens": 3043552} +{"current_steps": 5245, "total_steps": 134280, "loss": 0.6934, "lr": 1.9526362823949957e-05, "epoch": 0.7812034554661901, "percentage": 3.91, "elapsed_time": "0:20:13", "remaining_time": "8:17:24", "throughput": 2511.63, "total_tokens": 3046944} +{"current_steps": 5250, "total_steps": 134280, "loss": 0.6397, "lr": 1.9544980637473935e-05, "epoch": 0.7819481680071493, "percentage": 3.91, "elapsed_time": "0:20:14", "remaining_time": "8:17:24", "throughput": 2511.66, "total_tokens": 3049952} +{"current_steps": 5255, "total_steps": 134280, "loss": 0.6743, "lr": 1.9563598450997917e-05, "epoch": 0.7826928805481085, "percentage": 3.91, "elapsed_time": "0:20:15", "remaining_time": "8:17:21", "throughput": 2511.6, "total_tokens": 3052576} +{"current_steps": 5260, "total_steps": 134280, "loss": 0.5849, "lr": 1.9582216264521895e-05, "epoch": 0.7834375930890676, "percentage": 3.92, "elapsed_time": "0:20:16", "remaining_time": "8:17:21", "throughput": 2511.55, "total_tokens": 3055520} +{"current_steps": 5265, "total_steps": 134280, "loss": 0.731, "lr": 1.9600834078045877e-05, "epoch": 0.7841823056300268, "percentage": 3.92, "elapsed_time": "0:20:17", "remaining_time": "8:17:17", "throughput": 2511.48, "total_tokens": 3058112} +{"current_steps": 5270, "total_steps": 134280, "loss": 0.5914, "lr": 1.9619451891569855e-05, "epoch": 0.784927018170986, "percentage": 3.92, "elapsed_time": "0:20:18", "remaining_time": "8:17:16", "throughput": 2511.52, "total_tokens": 3061024} +{"current_steps": 5275, "total_steps": 134280, "loss": 0.6728, "lr": 1.9638069705093833e-05, "epoch": 0.7856717307119452, "percentage": 3.93, "elapsed_time": "0:20:20", "remaining_time": "8:17:16", "throughput": 2511.56, "total_tokens": 3064160} +{"current_steps": 5280, "total_steps": 134280, "loss": 0.5811, "lr": 1.9656687518617815e-05, "epoch": 0.7864164432529044, "percentage": 3.93, "elapsed_time": "0:20:21", "remaining_time": "8:17:14", "throughput": 2511.54, "total_tokens": 3066912} +{"current_steps": 5285, "total_steps": 134280, "loss": 0.5347, "lr": 1.9675305332141793e-05, "epoch": 0.7871611557938636, "percentage": 3.94, "elapsed_time": "0:20:22", "remaining_time": "8:17:13", "throughput": 2511.57, "total_tokens": 3069856} +{"current_steps": 5290, "total_steps": 134280, "loss": 0.6032, "lr": 1.9693923145665775e-05, "epoch": 0.7879058683348228, "percentage": 3.94, "elapsed_time": "0:20:23", "remaining_time": "8:17:10", "throughput": 2511.48, "total_tokens": 3072448} +{"current_steps": 5295, "total_steps": 134280, "loss": 0.8745, "lr": 1.9712540959189753e-05, "epoch": 0.788650580875782, "percentage": 3.94, "elapsed_time": "0:20:24", "remaining_time": "8:17:09", "throughput": 2511.49, "total_tokens": 3075392} +{"current_steps": 5300, "total_steps": 134280, "loss": 0.7794, "lr": 1.9731158772713735e-05, "epoch": 0.7893952934167411, "percentage": 3.95, "elapsed_time": "0:20:25", "remaining_time": "8:17:07", "throughput": 2511.46, "total_tokens": 3078176} +{"current_steps": 5305, "total_steps": 134280, "loss": 0.699, "lr": 1.9749776586237713e-05, "epoch": 0.7901400059577003, "percentage": 3.95, "elapsed_time": "0:20:26", "remaining_time": "8:17:05", "throughput": 2511.47, "total_tokens": 3081024} +{"current_steps": 5310, "total_steps": 134280, "loss": 0.594, "lr": 1.976839439976169e-05, "epoch": 0.7908847184986595, "percentage": 3.95, "elapsed_time": "0:20:27", "remaining_time": "8:17:04", "throughput": 2511.42, "total_tokens": 3083840} +{"current_steps": 5315, "total_steps": 134280, "loss": 0.648, "lr": 1.9787012213285673e-05, "epoch": 0.7916294310396187, "percentage": 3.96, "elapsed_time": "0:20:29", "remaining_time": "8:17:01", "throughput": 2511.39, "total_tokens": 3086560} +{"current_steps": 5320, "total_steps": 134280, "loss": 0.6876, "lr": 1.980563002680965e-05, "epoch": 0.7923741435805779, "percentage": 3.96, "elapsed_time": "0:20:30", "remaining_time": "8:16:59", "throughput": 2511.41, "total_tokens": 3089440} +{"current_steps": 5325, "total_steps": 134280, "loss": 0.5284, "lr": 1.9824247840333632e-05, "epoch": 0.7931188561215371, "percentage": 3.97, "elapsed_time": "0:20:31", "remaining_time": "8:16:57", "throughput": 2511.39, "total_tokens": 3092192} +{"current_steps": 5330, "total_steps": 134280, "loss": 0.6215, "lr": 1.984286565385761e-05, "epoch": 0.7938635686624963, "percentage": 3.97, "elapsed_time": "0:20:32", "remaining_time": "8:16:57", "throughput": 2511.46, "total_tokens": 3095264} +{"current_steps": 5335, "total_steps": 134280, "loss": 0.5973, "lr": 1.9861483467381592e-05, "epoch": 0.7946082812034555, "percentage": 3.97, "elapsed_time": "0:20:33", "remaining_time": "8:16:57", "throughput": 2511.43, "total_tokens": 3098272} +{"current_steps": 5340, "total_steps": 134280, "loss": 0.7475, "lr": 1.988010128090557e-05, "epoch": 0.7953529937444147, "percentage": 3.98, "elapsed_time": "0:20:34", "remaining_time": "8:16:56", "throughput": 2511.44, "total_tokens": 3101216} +{"current_steps": 5345, "total_steps": 134280, "loss": 0.6288, "lr": 1.9898719094429552e-05, "epoch": 0.7960977062853738, "percentage": 3.98, "elapsed_time": "0:20:35", "remaining_time": "8:16:54", "throughput": 2511.39, "total_tokens": 3104032} +{"current_steps": 5350, "total_steps": 134280, "loss": 0.7673, "lr": 1.9917336907953534e-05, "epoch": 0.796842418826333, "percentage": 3.98, "elapsed_time": "0:20:37", "remaining_time": "8:16:52", "throughput": 2511.38, "total_tokens": 3106784} +{"current_steps": 5355, "total_steps": 134280, "loss": 0.742, "lr": 1.993595472147751e-05, "epoch": 0.7975871313672922, "percentage": 3.99, "elapsed_time": "0:20:38", "remaining_time": "8:16:49", "throughput": 2511.31, "total_tokens": 3109440} +{"current_steps": 5360, "total_steps": 134280, "loss": 0.6396, "lr": 1.995457253500149e-05, "epoch": 0.7983318439082514, "percentage": 3.99, "elapsed_time": "0:20:39", "remaining_time": "8:16:48", "throughput": 2511.37, "total_tokens": 3112448} +{"current_steps": 5365, "total_steps": 134280, "loss": 0.5642, "lr": 1.997319034852547e-05, "epoch": 0.7990765564492106, "percentage": 4.0, "elapsed_time": "0:20:40", "remaining_time": "8:16:47", "throughput": 2511.32, "total_tokens": 3115264} +{"current_steps": 5370, "total_steps": 134280, "loss": 0.6355, "lr": 1.999180816204945e-05, "epoch": 0.7998212689901698, "percentage": 4.0, "elapsed_time": "0:20:41", "remaining_time": "8:16:45", "throughput": 2511.31, "total_tokens": 3118016} +{"current_steps": 5375, "total_steps": 134280, "loss": 0.5918, "lr": 2.001042597557343e-05, "epoch": 0.800565981531129, "percentage": 4.0, "elapsed_time": "0:20:42", "remaining_time": "8:16:44", "throughput": 2511.34, "total_tokens": 3121056} +{"current_steps": 5380, "total_steps": 134280, "loss": 0.6208, "lr": 2.002904378909741e-05, "epoch": 0.8013106940720882, "percentage": 4.01, "elapsed_time": "0:20:43", "remaining_time": "8:16:43", "throughput": 2511.37, "total_tokens": 3123936} +{"current_steps": 5385, "total_steps": 134280, "loss": 0.8782, "lr": 2.0047661602621388e-05, "epoch": 0.8020554066130474, "percentage": 4.01, "elapsed_time": "0:20:45", "remaining_time": "8:16:41", "throughput": 2511.39, "total_tokens": 3126816} +{"current_steps": 5390, "total_steps": 134280, "loss": 0.5842, "lr": 2.006627941614537e-05, "epoch": 0.8028001191540065, "percentage": 4.01, "elapsed_time": "0:20:46", "remaining_time": "8:16:40", "throughput": 2511.42, "total_tokens": 3129792} +{"current_steps": 5395, "total_steps": 134280, "loss": 0.729, "lr": 2.008489722966935e-05, "epoch": 0.8035448316949657, "percentage": 4.02, "elapsed_time": "0:20:47", "remaining_time": "8:16:40", "throughput": 2511.46, "total_tokens": 3132832} +{"current_steps": 5400, "total_steps": 134280, "loss": 0.7065, "lr": 2.0103515043193326e-05, "epoch": 0.8042895442359249, "percentage": 4.02, "elapsed_time": "0:20:48", "remaining_time": "8:16:40", "throughput": 2511.5, "total_tokens": 3135968} +{"current_steps": 5405, "total_steps": 134280, "loss": 0.8606, "lr": 2.0122132856717308e-05, "epoch": 0.8050342567768841, "percentage": 4.03, "elapsed_time": "0:20:49", "remaining_time": "8:16:38", "throughput": 2511.5, "total_tokens": 3138752} +{"current_steps": 5410, "total_steps": 134280, "loss": 0.6785, "lr": 2.0140750670241286e-05, "epoch": 0.8057789693178433, "percentage": 4.03, "elapsed_time": "0:20:50", "remaining_time": "8:16:37", "throughput": 2511.51, "total_tokens": 3141696} +{"current_steps": 5415, "total_steps": 134280, "loss": 0.539, "lr": 2.0159368483765268e-05, "epoch": 0.8065236818588025, "percentage": 4.03, "elapsed_time": "0:20:52", "remaining_time": "8:16:35", "throughput": 2511.42, "total_tokens": 3144352} +{"current_steps": 5420, "total_steps": 134280, "loss": 0.6995, "lr": 2.0177986297289246e-05, "epoch": 0.8072683943997617, "percentage": 4.04, "elapsed_time": "0:20:53", "remaining_time": "8:16:33", "throughput": 2511.34, "total_tokens": 3147040} +{"current_steps": 5425, "total_steps": 134280, "loss": 0.8315, "lr": 2.0196604110813228e-05, "epoch": 0.8080131069407209, "percentage": 4.04, "elapsed_time": "0:20:54", "remaining_time": "8:16:32", "throughput": 2511.38, "total_tokens": 3150080} +{"current_steps": 5430, "total_steps": 134280, "loss": 0.5055, "lr": 2.021522192433721e-05, "epoch": 0.80875781948168, "percentage": 4.04, "elapsed_time": "0:20:55", "remaining_time": "8:16:31", "throughput": 2511.42, "total_tokens": 3152992} +{"current_steps": 5435, "total_steps": 134280, "loss": 0.8085, "lr": 2.0233839737861187e-05, "epoch": 0.8095025320226392, "percentage": 4.05, "elapsed_time": "0:20:56", "remaining_time": "8:16:30", "throughput": 2511.4, "total_tokens": 3155936} +{"current_steps": 5440, "total_steps": 134280, "loss": 0.5796, "lr": 2.0252457551385166e-05, "epoch": 0.8102472445635984, "percentage": 4.05, "elapsed_time": "0:20:57", "remaining_time": "8:16:29", "throughput": 2511.43, "total_tokens": 3158912} +{"current_steps": 5445, "total_steps": 134280, "loss": 0.6783, "lr": 2.0271075364909144e-05, "epoch": 0.8109919571045576, "percentage": 4.05, "elapsed_time": "0:20:59", "remaining_time": "8:16:29", "throughput": 2511.43, "total_tokens": 3161920} +{"current_steps": 5450, "total_steps": 134280, "loss": 0.694, "lr": 2.0289693178433126e-05, "epoch": 0.8117366696455168, "percentage": 4.06, "elapsed_time": "0:21:00", "remaining_time": "8:16:31", "throughput": 2511.49, "total_tokens": 3165184} +{"current_steps": 5455, "total_steps": 134280, "loss": 0.6686, "lr": 2.0308310991957104e-05, "epoch": 0.812481382186476, "percentage": 4.06, "elapsed_time": "0:21:01", "remaining_time": "8:16:32", "throughput": 2511.61, "total_tokens": 3168512} +{"current_steps": 5460, "total_steps": 134280, "loss": 0.5766, "lr": 2.0326928805481085e-05, "epoch": 0.8132260947274352, "percentage": 4.07, "elapsed_time": "0:21:02", "remaining_time": "8:16:29", "throughput": 2511.57, "total_tokens": 3171168} +{"current_steps": 5465, "total_steps": 134280, "loss": 0.6602, "lr": 2.0345546619005064e-05, "epoch": 0.8139708072683944, "percentage": 4.07, "elapsed_time": "0:21:03", "remaining_time": "8:16:27", "throughput": 2511.5, "total_tokens": 3173888} +{"current_steps": 5470, "total_steps": 134280, "loss": 0.8173, "lr": 2.0364164432529045e-05, "epoch": 0.8147155198093536, "percentage": 4.07, "elapsed_time": "0:21:04", "remaining_time": "8:16:26", "throughput": 2511.5, "total_tokens": 3176800} +{"current_steps": 5475, "total_steps": 134280, "loss": 0.6154, "lr": 2.0382782246053027e-05, "epoch": 0.8154602323503127, "percentage": 4.08, "elapsed_time": "0:21:06", "remaining_time": "8:16:24", "throughput": 2511.46, "total_tokens": 3179552} +{"current_steps": 5480, "total_steps": 134280, "loss": 0.7969, "lr": 2.0401400059577005e-05, "epoch": 0.8162049448912719, "percentage": 4.08, "elapsed_time": "0:21:07", "remaining_time": "8:16:22", "throughput": 2511.46, "total_tokens": 3182400} +{"current_steps": 5485, "total_steps": 134280, "loss": 0.7698, "lr": 2.0420017873100983e-05, "epoch": 0.8169496574322311, "percentage": 4.08, "elapsed_time": "0:21:08", "remaining_time": "8:16:21", "throughput": 2511.47, "total_tokens": 3185280} +{"current_steps": 5490, "total_steps": 134280, "loss": 0.5247, "lr": 2.043863568662496e-05, "epoch": 0.8176943699731903, "percentage": 4.09, "elapsed_time": "0:21:09", "remaining_time": "8:16:20", "throughput": 2511.43, "total_tokens": 3188128} +{"current_steps": 5495, "total_steps": 134280, "loss": 0.5978, "lr": 2.0457253500148943e-05, "epoch": 0.8184390825141495, "percentage": 4.09, "elapsed_time": "0:21:10", "remaining_time": "8:16:19", "throughput": 2511.39, "total_tokens": 3191072} +{"current_steps": 5500, "total_steps": 134280, "loss": 0.6518, "lr": 2.047587131367292e-05, "epoch": 0.8191837950551087, "percentage": 4.1, "elapsed_time": "0:21:11", "remaining_time": "8:16:20", "throughput": 2511.47, "total_tokens": 3194272} +{"current_steps": 5505, "total_steps": 134280, "loss": 0.7665, "lr": 2.0494489127196903e-05, "epoch": 0.819928507596068, "percentage": 4.1, "elapsed_time": "0:21:12", "remaining_time": "8:16:17", "throughput": 2511.46, "total_tokens": 3196992} +{"current_steps": 5510, "total_steps": 134280, "loss": 0.5986, "lr": 2.0513106940720885e-05, "epoch": 0.8206732201370271, "percentage": 4.1, "elapsed_time": "0:21:14", "remaining_time": "8:16:17", "throughput": 2511.52, "total_tokens": 3200096} +{"current_steps": 5515, "total_steps": 134280, "loss": 0.7196, "lr": 2.0531724754244863e-05, "epoch": 0.8214179326779864, "percentage": 4.11, "elapsed_time": "0:21:15", "remaining_time": "8:16:17", "throughput": 2511.52, "total_tokens": 3203104} +{"current_steps": 5520, "total_steps": 134280, "loss": 0.6772, "lr": 2.0550342567768845e-05, "epoch": 0.8221626452189454, "percentage": 4.11, "elapsed_time": "0:21:16", "remaining_time": "8:16:14", "throughput": 2511.43, "total_tokens": 3205728} +{"current_steps": 5525, "total_steps": 134280, "loss": 0.5544, "lr": 2.0568960381292823e-05, "epoch": 0.8229073577599046, "percentage": 4.11, "elapsed_time": "0:21:17", "remaining_time": "8:16:11", "throughput": 2511.32, "total_tokens": 3208320} +{"current_steps": 5530, "total_steps": 134280, "loss": 0.7325, "lr": 2.05875781948168e-05, "epoch": 0.8236520703008638, "percentage": 4.12, "elapsed_time": "0:21:18", "remaining_time": "8:16:09", "throughput": 2511.3, "total_tokens": 3211072} +{"current_steps": 5535, "total_steps": 134280, "loss": 0.6469, "lr": 2.060619600834078e-05, "epoch": 0.824396782841823, "percentage": 4.12, "elapsed_time": "0:21:19", "remaining_time": "8:16:09", "throughput": 2511.34, "total_tokens": 3214144} +{"current_steps": 5540, "total_steps": 134280, "loss": 0.7574, "lr": 2.062481382186476e-05, "epoch": 0.8251414953827823, "percentage": 4.13, "elapsed_time": "0:21:20", "remaining_time": "8:16:07", "throughput": 2511.34, "total_tokens": 3216992} +{"current_steps": 5545, "total_steps": 134280, "loss": 0.7546, "lr": 2.0643431635388742e-05, "epoch": 0.8258862079237415, "percentage": 4.13, "elapsed_time": "0:21:22", "remaining_time": "8:16:07", "throughput": 2511.38, "total_tokens": 3220064} +{"current_steps": 5550, "total_steps": 134280, "loss": 0.4633, "lr": 2.066204944891272e-05, "epoch": 0.8266309204647007, "percentage": 4.13, "elapsed_time": "0:21:23", "remaining_time": "8:16:06", "throughput": 2511.35, "total_tokens": 3222880} +{"current_steps": 5555, "total_steps": 134280, "loss": 0.6306, "lr": 2.0680667262436702e-05, "epoch": 0.8273756330056599, "percentage": 4.14, "elapsed_time": "0:21:24", "remaining_time": "8:16:05", "throughput": 2511.43, "total_tokens": 3225952} +{"current_steps": 5560, "total_steps": 134280, "loss": 0.8442, "lr": 2.069928507596068e-05, "epoch": 0.828120345546619, "percentage": 4.14, "elapsed_time": "0:21:25", "remaining_time": "8:16:03", "throughput": 2511.37, "total_tokens": 3228672} +{"current_steps": 5565, "total_steps": 134280, "loss": 0.6217, "lr": 2.0717902889484662e-05, "epoch": 0.8288650580875782, "percentage": 4.14, "elapsed_time": "0:21:26", "remaining_time": "8:16:01", "throughput": 2511.33, "total_tokens": 3231392} +{"current_steps": 5570, "total_steps": 134280, "loss": 0.6113, "lr": 2.0736520703008637e-05, "epoch": 0.8296097706285374, "percentage": 4.15, "elapsed_time": "0:21:27", "remaining_time": "8:15:59", "throughput": 2511.32, "total_tokens": 3234272} +{"current_steps": 5575, "total_steps": 134280, "loss": 0.7404, "lr": 2.075513851653262e-05, "epoch": 0.8303544831694966, "percentage": 4.15, "elapsed_time": "0:21:29", "remaining_time": "8:15:58", "throughput": 2511.28, "total_tokens": 3237056} +{"current_steps": 5580, "total_steps": 134280, "loss": 0.6061, "lr": 2.0773756330056597e-05, "epoch": 0.8310991957104558, "percentage": 4.16, "elapsed_time": "0:21:30", "remaining_time": "8:15:57", "throughput": 2511.34, "total_tokens": 3240064} +{"current_steps": 5585, "total_steps": 134280, "loss": 0.6918, "lr": 2.079237414358058e-05, "epoch": 0.831843908251415, "percentage": 4.16, "elapsed_time": "0:21:31", "remaining_time": "8:15:56", "throughput": 2511.39, "total_tokens": 3243072} +{"current_steps": 5590, "total_steps": 134280, "loss": 0.7187, "lr": 2.081099195710456e-05, "epoch": 0.8325886207923742, "percentage": 4.16, "elapsed_time": "0:21:32", "remaining_time": "8:15:54", "throughput": 2511.39, "total_tokens": 3245920} +{"current_steps": 5595, "total_steps": 134280, "loss": 0.71, "lr": 2.082960977062854e-05, "epoch": 0.8333333333333334, "percentage": 4.17, "elapsed_time": "0:21:33", "remaining_time": "8:15:56", "throughput": 2511.48, "total_tokens": 3249280} +{"current_steps": 5600, "total_steps": 134280, "loss": 0.6093, "lr": 2.084822758415252e-05, "epoch": 0.8340780458742926, "percentage": 4.17, "elapsed_time": "0:21:34", "remaining_time": "8:15:56", "throughput": 2511.54, "total_tokens": 3252320} +{"current_steps": 5605, "total_steps": 134280, "loss": 0.6249, "lr": 2.0866845397676498e-05, "epoch": 0.8348227584152517, "percentage": 4.17, "elapsed_time": "0:21:36", "remaining_time": "8:15:57", "throughput": 2511.54, "total_tokens": 3255456} +{"current_steps": 5610, "total_steps": 134280, "loss": 0.6749, "lr": 2.088546321120048e-05, "epoch": 0.8355674709562109, "percentage": 4.18, "elapsed_time": "0:21:37", "remaining_time": "8:15:54", "throughput": 2511.52, "total_tokens": 3258144} +{"current_steps": 5615, "total_steps": 134280, "loss": 0.7227, "lr": 2.0904081024724455e-05, "epoch": 0.8363121834971701, "percentage": 4.18, "elapsed_time": "0:21:38", "remaining_time": "8:15:51", "throughput": 2511.5, "total_tokens": 3260832} +{"current_steps": 5620, "total_steps": 134280, "loss": 0.7272, "lr": 2.0922698838248436e-05, "epoch": 0.8370568960381293, "percentage": 4.19, "elapsed_time": "0:21:39", "remaining_time": "8:15:49", "throughput": 2511.51, "total_tokens": 3263712} +{"current_steps": 5625, "total_steps": 134280, "loss": 0.6762, "lr": 2.0941316651772418e-05, "epoch": 0.8378016085790885, "percentage": 4.19, "elapsed_time": "0:21:40", "remaining_time": "8:15:48", "throughput": 2511.55, "total_tokens": 3266688} +{"current_steps": 5630, "total_steps": 134280, "loss": 0.7984, "lr": 2.0959934465296396e-05, "epoch": 0.8385463211200477, "percentage": 4.19, "elapsed_time": "0:21:41", "remaining_time": "8:15:46", "throughput": 2511.54, "total_tokens": 3269504} +{"current_steps": 5635, "total_steps": 134280, "loss": 0.5116, "lr": 2.0978552278820378e-05, "epoch": 0.8392910336610069, "percentage": 4.2, "elapsed_time": "0:21:42", "remaining_time": "8:15:46", "throughput": 2511.61, "total_tokens": 3272608} +{"current_steps": 5640, "total_steps": 134280, "loss": 0.5714, "lr": 2.0997170092344356e-05, "epoch": 0.8400357462019661, "percentage": 4.2, "elapsed_time": "0:21:44", "remaining_time": "8:15:46", "throughput": 2511.61, "total_tokens": 3275584} +{"current_steps": 5645, "total_steps": 134280, "loss": 0.5671, "lr": 2.1015787905868338e-05, "epoch": 0.8407804587429253, "percentage": 4.2, "elapsed_time": "0:21:45", "remaining_time": "8:15:44", "throughput": 2511.57, "total_tokens": 3278368} +{"current_steps": 5650, "total_steps": 134280, "loss": 0.7249, "lr": 2.1034405719392316e-05, "epoch": 0.8415251712838844, "percentage": 4.21, "elapsed_time": "0:21:46", "remaining_time": "8:15:43", "throughput": 2511.61, "total_tokens": 3281312} +{"current_steps": 5655, "total_steps": 134280, "loss": 0.5391, "lr": 2.1053023532916297e-05, "epoch": 0.8422698838248436, "percentage": 4.21, "elapsed_time": "0:21:47", "remaining_time": "8:15:41", "throughput": 2511.61, "total_tokens": 3284128} +{"current_steps": 5660, "total_steps": 134280, "loss": 0.6088, "lr": 2.1071641346440272e-05, "epoch": 0.8430145963658028, "percentage": 4.22, "elapsed_time": "0:21:48", "remaining_time": "8:15:38", "throughput": 2511.56, "total_tokens": 3286816} +{"current_steps": 5665, "total_steps": 134280, "loss": 0.5777, "lr": 2.1090259159964254e-05, "epoch": 0.843759308906762, "percentage": 4.22, "elapsed_time": "0:21:49", "remaining_time": "8:15:37", "throughput": 2511.65, "total_tokens": 3289824} +{"current_steps": 5670, "total_steps": 134280, "loss": 0.5642, "lr": 2.1108876973488236e-05, "epoch": 0.8445040214477212, "percentage": 4.22, "elapsed_time": "0:21:51", "remaining_time": "8:15:38", "throughput": 2511.76, "total_tokens": 3293152} +{"current_steps": 5675, "total_steps": 134280, "loss": 0.6739, "lr": 2.1127494787012214e-05, "epoch": 0.8452487339886804, "percentage": 4.23, "elapsed_time": "0:21:52", "remaining_time": "8:15:37", "throughput": 2511.74, "total_tokens": 3295968} +{"current_steps": 5680, "total_steps": 134280, "loss": 0.7355, "lr": 2.1146112600536195e-05, "epoch": 0.8459934465296396, "percentage": 4.23, "elapsed_time": "0:21:53", "remaining_time": "8:15:34", "throughput": 2511.64, "total_tokens": 3298528} +{"current_steps": 5685, "total_steps": 134280, "loss": 0.731, "lr": 2.1164730414060174e-05, "epoch": 0.8467381590705988, "percentage": 4.23, "elapsed_time": "0:21:54", "remaining_time": "8:15:35", "throughput": 2511.65, "total_tokens": 3301696} +{"current_steps": 5690, "total_steps": 134280, "loss": 0.7463, "lr": 2.1183348227584155e-05, "epoch": 0.8474828716115579, "percentage": 4.24, "elapsed_time": "0:21:55", "remaining_time": "8:15:34", "throughput": 2511.66, "total_tokens": 3304672} +{"current_steps": 5695, "total_steps": 134280, "loss": 0.627, "lr": 2.1201966041108133e-05, "epoch": 0.8482275841525171, "percentage": 4.24, "elapsed_time": "0:21:56", "remaining_time": "8:15:30", "throughput": 2511.56, "total_tokens": 3307168} +{"current_steps": 5700, "total_steps": 134280, "loss": 0.6607, "lr": 2.1220583854632112e-05, "epoch": 0.8489722966934763, "percentage": 4.24, "elapsed_time": "0:21:57", "remaining_time": "8:15:29", "throughput": 2511.54, "total_tokens": 3309952} +{"current_steps": 5705, "total_steps": 134280, "loss": 0.7317, "lr": 2.1239201668156093e-05, "epoch": 0.8497170092344355, "percentage": 4.25, "elapsed_time": "0:21:59", "remaining_time": "8:15:27", "throughput": 2511.52, "total_tokens": 3312800} +{"current_steps": 5710, "total_steps": 134280, "loss": 0.6606, "lr": 2.125781948168007e-05, "epoch": 0.8504617217753947, "percentage": 4.25, "elapsed_time": "0:22:00", "remaining_time": "8:15:26", "throughput": 2511.56, "total_tokens": 3315808} +{"current_steps": 5715, "total_steps": 134280, "loss": 0.7426, "lr": 2.1276437295204053e-05, "epoch": 0.8512064343163539, "percentage": 4.26, "elapsed_time": "0:22:01", "remaining_time": "8:15:25", "throughput": 2511.55, "total_tokens": 3318720} +{"current_steps": 5720, "total_steps": 134280, "loss": 0.6908, "lr": 2.129505510872803e-05, "epoch": 0.8519511468573131, "percentage": 4.26, "elapsed_time": "0:22:02", "remaining_time": "8:15:25", "throughput": 2511.56, "total_tokens": 3321728} +{"current_steps": 5725, "total_steps": 134280, "loss": 0.7111, "lr": 2.1313672922252013e-05, "epoch": 0.8526958593982723, "percentage": 4.26, "elapsed_time": "0:22:03", "remaining_time": "8:15:24", "throughput": 2511.55, "total_tokens": 3324640} +{"current_steps": 5730, "total_steps": 134280, "loss": 0.7563, "lr": 2.133229073577599e-05, "epoch": 0.8534405719392315, "percentage": 4.27, "elapsed_time": "0:22:04", "remaining_time": "8:15:23", "throughput": 2511.49, "total_tokens": 3327456} +{"current_steps": 5735, "total_steps": 134280, "loss": 0.6618, "lr": 2.1350908549299973e-05, "epoch": 0.8541852844801906, "percentage": 4.27, "elapsed_time": "0:22:06", "remaining_time": "8:15:23", "throughput": 2511.56, "total_tokens": 3330560} +{"current_steps": 5740, "total_steps": 134280, "loss": 0.7711, "lr": 2.136952636282395e-05, "epoch": 0.8549299970211498, "percentage": 4.27, "elapsed_time": "0:22:07", "remaining_time": "8:15:22", "throughput": 2511.59, "total_tokens": 3333600} +{"current_steps": 5745, "total_steps": 134280, "loss": 0.7042, "lr": 2.138814417634793e-05, "epoch": 0.855674709562109, "percentage": 4.28, "elapsed_time": "0:22:08", "remaining_time": "8:15:24", "throughput": 2511.62, "total_tokens": 3336800} +{"current_steps": 5750, "total_steps": 134280, "loss": 0.5533, "lr": 2.140676198987191e-05, "epoch": 0.8564194221030682, "percentage": 4.28, "elapsed_time": "0:22:09", "remaining_time": "8:15:21", "throughput": 2511.63, "total_tokens": 3339552} +{"current_steps": 5755, "total_steps": 134280, "loss": 0.5803, "lr": 2.142537980339589e-05, "epoch": 0.8571641346440274, "percentage": 4.29, "elapsed_time": "0:22:10", "remaining_time": "8:15:20", "throughput": 2511.71, "total_tokens": 3342624} +{"current_steps": 5760, "total_steps": 134280, "loss": 0.4835, "lr": 2.144399761691987e-05, "epoch": 0.8579088471849866, "percentage": 4.29, "elapsed_time": "0:22:12", "remaining_time": "8:15:22", "throughput": 2511.79, "total_tokens": 3345984} +{"current_steps": 5765, "total_steps": 134280, "loss": 0.5077, "lr": 2.146261543044385e-05, "epoch": 0.8586535597259458, "percentage": 4.29, "elapsed_time": "0:22:13", "remaining_time": "8:15:21", "throughput": 2511.79, "total_tokens": 3348864} +{"current_steps": 5770, "total_steps": 134280, "loss": 0.5176, "lr": 2.148123324396783e-05, "epoch": 0.859398272266905, "percentage": 4.3, "elapsed_time": "0:22:14", "remaining_time": "8:15:19", "throughput": 2511.81, "total_tokens": 3351744} +{"current_steps": 5775, "total_steps": 134280, "loss": 0.7003, "lr": 2.149985105749181e-05, "epoch": 0.8601429848078642, "percentage": 4.3, "elapsed_time": "0:22:15", "remaining_time": "8:15:17", "throughput": 2511.78, "total_tokens": 3354528} +{"current_steps": 5780, "total_steps": 134280, "loss": 0.6692, "lr": 2.151846887101579e-05, "epoch": 0.8608876973488233, "percentage": 4.3, "elapsed_time": "0:22:16", "remaining_time": "8:15:16", "throughput": 2511.77, "total_tokens": 3357376} +{"current_steps": 5785, "total_steps": 134280, "loss": 0.8655, "lr": 2.153708668453977e-05, "epoch": 0.8616324098897825, "percentage": 4.31, "elapsed_time": "0:22:17", "remaining_time": "8:15:14", "throughput": 2511.78, "total_tokens": 3360224} +{"current_steps": 5790, "total_steps": 134280, "loss": 0.5437, "lr": 2.1555704498063747e-05, "epoch": 0.8623771224307417, "percentage": 4.31, "elapsed_time": "0:22:18", "remaining_time": "8:15:11", "throughput": 2511.73, "total_tokens": 3362816} +{"current_steps": 5795, "total_steps": 134280, "loss": 0.7384, "lr": 2.157432231158773e-05, "epoch": 0.8631218349717009, "percentage": 4.32, "elapsed_time": "0:22:19", "remaining_time": "8:15:10", "throughput": 2511.74, "total_tokens": 3365728} +{"current_steps": 5800, "total_steps": 134280, "loss": 0.6481, "lr": 2.1592940125111707e-05, "epoch": 0.8638665475126601, "percentage": 4.32, "elapsed_time": "0:22:21", "remaining_time": "8:15:08", "throughput": 2511.66, "total_tokens": 3368448} +{"current_steps": 5805, "total_steps": 134280, "loss": 0.6728, "lr": 2.161155793863569e-05, "epoch": 0.8646112600536193, "percentage": 4.32, "elapsed_time": "0:22:22", "remaining_time": "8:15:07", "throughput": 2511.62, "total_tokens": 3371392} +{"current_steps": 5810, "total_steps": 134280, "loss": 0.5294, "lr": 2.1630175752159667e-05, "epoch": 0.8653559725945785, "percentage": 4.33, "elapsed_time": "0:22:23", "remaining_time": "8:15:05", "throughput": 2511.51, "total_tokens": 3373952} +{"current_steps": 5815, "total_steps": 134280, "loss": 0.6446, "lr": 2.164879356568365e-05, "epoch": 0.8661006851355377, "percentage": 4.33, "elapsed_time": "0:22:24", "remaining_time": "8:15:02", "throughput": 2511.48, "total_tokens": 3376672} +{"current_steps": 5820, "total_steps": 134280, "loss": 0.8751, "lr": 2.1667411379207627e-05, "epoch": 0.8668453976764968, "percentage": 4.33, "elapsed_time": "0:22:25", "remaining_time": "8:15:03", "throughput": 2511.53, "total_tokens": 3379840} +{"current_steps": 5825, "total_steps": 134280, "loss": 0.5861, "lr": 2.1686029192731608e-05, "epoch": 0.867590110217456, "percentage": 4.34, "elapsed_time": "0:22:26", "remaining_time": "8:15:01", "throughput": 2511.5, "total_tokens": 3382592} +{"current_steps": 5830, "total_steps": 134280, "loss": 0.7713, "lr": 2.1704647006255586e-05, "epoch": 0.8683348227584152, "percentage": 4.34, "elapsed_time": "0:22:27", "remaining_time": "8:14:58", "throughput": 2511.44, "total_tokens": 3385248} +{"current_steps": 5835, "total_steps": 134280, "loss": 0.7095, "lr": 2.1723264819779565e-05, "epoch": 0.8690795352993744, "percentage": 4.35, "elapsed_time": "0:22:29", "remaining_time": "8:14:58", "throughput": 2511.45, "total_tokens": 3388288} +{"current_steps": 5840, "total_steps": 134280, "loss": 0.7318, "lr": 2.1741882633303546e-05, "epoch": 0.8698242478403336, "percentage": 4.35, "elapsed_time": "0:22:30", "remaining_time": "8:14:56", "throughput": 2511.4, "total_tokens": 3391008} +{"current_steps": 5845, "total_steps": 134280, "loss": 0.5848, "lr": 2.1760500446827525e-05, "epoch": 0.8705689603812928, "percentage": 4.35, "elapsed_time": "0:22:31", "remaining_time": "8:14:55", "throughput": 2511.4, "total_tokens": 3393920} +{"current_steps": 5850, "total_steps": 134280, "loss": 0.7681, "lr": 2.1779118260351506e-05, "epoch": 0.871313672922252, "percentage": 4.36, "elapsed_time": "0:22:32", "remaining_time": "8:14:53", "throughput": 2511.37, "total_tokens": 3396768} +{"current_steps": 5855, "total_steps": 134280, "loss": 0.7299, "lr": 2.1797736073875484e-05, "epoch": 0.8720583854632112, "percentage": 4.36, "elapsed_time": "0:22:33", "remaining_time": "8:14:52", "throughput": 2511.36, "total_tokens": 3399680} +{"current_steps": 5860, "total_steps": 134280, "loss": 0.6535, "lr": 2.1816353887399466e-05, "epoch": 0.8728030980041704, "percentage": 4.36, "elapsed_time": "0:22:34", "remaining_time": "8:14:50", "throughput": 2511.4, "total_tokens": 3402528} +{"current_steps": 5865, "total_steps": 134280, "loss": 0.5424, "lr": 2.1834971700923444e-05, "epoch": 0.8735478105451295, "percentage": 4.37, "elapsed_time": "0:22:35", "remaining_time": "8:14:48", "throughput": 2511.37, "total_tokens": 3405248} +{"current_steps": 5870, "total_steps": 134280, "loss": 0.6838, "lr": 2.1853589514447426e-05, "epoch": 0.8742925230860887, "percentage": 4.37, "elapsed_time": "0:22:37", "remaining_time": "8:14:49", "throughput": 2511.42, "total_tokens": 3408448} +{"current_steps": 5875, "total_steps": 134280, "loss": 0.7105, "lr": 2.1872207327971404e-05, "epoch": 0.8750372356270479, "percentage": 4.38, "elapsed_time": "0:22:38", "remaining_time": "8:14:48", "throughput": 2511.47, "total_tokens": 3411520} +{"current_steps": 5880, "total_steps": 134280, "loss": 0.4796, "lr": 2.1890825141495382e-05, "epoch": 0.8757819481680071, "percentage": 4.38, "elapsed_time": "0:22:39", "remaining_time": "8:14:47", "throughput": 2511.55, "total_tokens": 3414528} +{"current_steps": 5885, "total_steps": 134280, "loss": 0.774, "lr": 2.1909442955019364e-05, "epoch": 0.8765266607089663, "percentage": 4.38, "elapsed_time": "0:22:40", "remaining_time": "8:14:45", "throughput": 2511.49, "total_tokens": 3417280} +{"current_steps": 5890, "total_steps": 134280, "loss": 0.5396, "lr": 2.1928060768543342e-05, "epoch": 0.8772713732499255, "percentage": 4.39, "elapsed_time": "0:22:41", "remaining_time": "8:14:46", "throughput": 2511.52, "total_tokens": 3420416} +{"current_steps": 5895, "total_steps": 134280, "loss": 0.5112, "lr": 2.1946678582067324e-05, "epoch": 0.8780160857908847, "percentage": 4.39, "elapsed_time": "0:22:42", "remaining_time": "8:14:43", "throughput": 2511.47, "total_tokens": 3423104} +{"current_steps": 5900, "total_steps": 134280, "loss": 0.5858, "lr": 2.1965296395591302e-05, "epoch": 0.878760798331844, "percentage": 4.39, "elapsed_time": "0:22:44", "remaining_time": "8:14:42", "throughput": 2511.52, "total_tokens": 3426080} +{"current_steps": 5905, "total_steps": 134280, "loss": 0.5647, "lr": 2.1983914209115284e-05, "epoch": 0.8795055108728032, "percentage": 4.4, "elapsed_time": "0:22:45", "remaining_time": "8:14:42", "throughput": 2511.55, "total_tokens": 3429152} +{"current_steps": 5910, "total_steps": 134280, "loss": 0.8932, "lr": 2.2002532022639262e-05, "epoch": 0.8802502234137622, "percentage": 4.4, "elapsed_time": "0:22:46", "remaining_time": "8:14:40", "throughput": 2511.54, "total_tokens": 3431904} +{"current_steps": 5915, "total_steps": 134280, "loss": 0.6134, "lr": 2.202114983616324e-05, "epoch": 0.8809949359547214, "percentage": 4.4, "elapsed_time": "0:22:47", "remaining_time": "8:14:39", "throughput": 2511.57, "total_tokens": 3434880} +{"current_steps": 5920, "total_steps": 134280, "loss": 0.7436, "lr": 2.2039767649687222e-05, "epoch": 0.8817396484956807, "percentage": 4.41, "elapsed_time": "0:22:48", "remaining_time": "8:14:37", "throughput": 2511.58, "total_tokens": 3437728} +{"current_steps": 5925, "total_steps": 134280, "loss": 0.5644, "lr": 2.20583854632112e-05, "epoch": 0.8824843610366399, "percentage": 4.41, "elapsed_time": "0:22:49", "remaining_time": "8:14:36", "throughput": 2511.59, "total_tokens": 3440640} +{"current_steps": 5930, "total_steps": 134280, "loss": 0.7169, "lr": 2.207700327673518e-05, "epoch": 0.883229073577599, "percentage": 4.42, "elapsed_time": "0:22:51", "remaining_time": "8:14:34", "throughput": 2511.6, "total_tokens": 3443488} +{"current_steps": 5935, "total_steps": 134280, "loss": 0.5655, "lr": 2.209562109025916e-05, "epoch": 0.8839737861185583, "percentage": 4.42, "elapsed_time": "0:22:52", "remaining_time": "8:14:32", "throughput": 2511.53, "total_tokens": 3446176} +{"current_steps": 5940, "total_steps": 134280, "loss": 0.6887, "lr": 2.211423890378314e-05, "epoch": 0.8847184986595175, "percentage": 4.42, "elapsed_time": "0:22:53", "remaining_time": "8:14:30", "throughput": 2511.53, "total_tokens": 3448960} +{"current_steps": 5945, "total_steps": 134280, "loss": 0.4369, "lr": 2.213285671730712e-05, "epoch": 0.8854632112004767, "percentage": 4.43, "elapsed_time": "0:22:54", "remaining_time": "8:14:27", "throughput": 2511.51, "total_tokens": 3451648} +{"current_steps": 5950, "total_steps": 134280, "loss": 0.8665, "lr": 2.21514745308311e-05, "epoch": 0.8862079237414358, "percentage": 4.43, "elapsed_time": "0:22:55", "remaining_time": "8:14:25", "throughput": 2511.53, "total_tokens": 3454464} +{"current_steps": 5955, "total_steps": 134280, "loss": 0.6037, "lr": 2.2170092344355083e-05, "epoch": 0.886952636282395, "percentage": 4.43, "elapsed_time": "0:22:56", "remaining_time": "8:14:23", "throughput": 2511.5, "total_tokens": 3457248} +{"current_steps": 5960, "total_steps": 134280, "loss": 0.6106, "lr": 2.2188710157879058e-05, "epoch": 0.8876973488233542, "percentage": 4.44, "elapsed_time": "0:22:57", "remaining_time": "8:14:21", "throughput": 2511.41, "total_tokens": 3459872} +{"current_steps": 5965, "total_steps": 134280, "loss": 0.6191, "lr": 2.220732797140304e-05, "epoch": 0.8884420613643134, "percentage": 4.44, "elapsed_time": "0:22:58", "remaining_time": "8:14:21", "throughput": 2511.38, "total_tokens": 3462880} +{"current_steps": 5970, "total_steps": 134280, "loss": 0.6473, "lr": 2.2225945784927018e-05, "epoch": 0.8891867739052726, "percentage": 4.45, "elapsed_time": "0:23:00", "remaining_time": "8:14:20", "throughput": 2511.39, "total_tokens": 3465792} +{"current_steps": 5975, "total_steps": 134280, "loss": 0.7022, "lr": 2.2244563598451e-05, "epoch": 0.8899314864462318, "percentage": 4.45, "elapsed_time": "0:23:01", "remaining_time": "8:14:18", "throughput": 2511.38, "total_tokens": 3468608} +{"current_steps": 5980, "total_steps": 134280, "loss": 0.6365, "lr": 2.2263181411974977e-05, "epoch": 0.890676198987191, "percentage": 4.45, "elapsed_time": "0:23:02", "remaining_time": "8:14:17", "throughput": 2511.35, "total_tokens": 3471520} +{"current_steps": 5985, "total_steps": 134280, "loss": 0.705, "lr": 2.228179922549896e-05, "epoch": 0.8914209115281502, "percentage": 4.46, "elapsed_time": "0:23:03", "remaining_time": "8:14:16", "throughput": 2511.34, "total_tokens": 3474432} +{"current_steps": 5990, "total_steps": 134280, "loss": 0.6178, "lr": 2.2300417039022937e-05, "epoch": 0.8921656240691094, "percentage": 4.46, "elapsed_time": "0:23:04", "remaining_time": "8:14:14", "throughput": 2511.32, "total_tokens": 3477216} +{"current_steps": 5995, "total_steps": 134280, "loss": 0.7024, "lr": 2.231903485254692e-05, "epoch": 0.8929103366100685, "percentage": 4.46, "elapsed_time": "0:23:05", "remaining_time": "8:14:13", "throughput": 2511.36, "total_tokens": 3480160} +{"current_steps": 6000, "total_steps": 134280, "loss": 0.5738, "lr": 2.23376526660709e-05, "epoch": 0.8936550491510277, "percentage": 4.47, "elapsed_time": "0:23:06", "remaining_time": "8:14:11", "throughput": 2511.39, "total_tokens": 3483040} +{"current_steps": 6005, "total_steps": 134280, "loss": 0.6152, "lr": 2.2356270479594875e-05, "epoch": 0.8943997616919869, "percentage": 4.47, "elapsed_time": "0:23:08", "remaining_time": "8:14:10", "throughput": 2511.36, "total_tokens": 3485824} +{"current_steps": 6010, "total_steps": 134280, "loss": 0.6462, "lr": 2.2374888293118857e-05, "epoch": 0.8951444742329461, "percentage": 4.48, "elapsed_time": "0:23:09", "remaining_time": "8:14:07", "throughput": 2511.35, "total_tokens": 3488544} +{"current_steps": 6015, "total_steps": 134280, "loss": 0.6937, "lr": 2.2393506106642835e-05, "epoch": 0.8958891867739053, "percentage": 4.48, "elapsed_time": "0:23:10", "remaining_time": "8:14:07", "throughput": 2511.38, "total_tokens": 3491680} +{"current_steps": 6020, "total_steps": 134280, "loss": 0.7714, "lr": 2.2412123920166817e-05, "epoch": 0.8966338993148645, "percentage": 4.48, "elapsed_time": "0:23:11", "remaining_time": "8:14:08", "throughput": 2511.4, "total_tokens": 3494784} +{"current_steps": 6025, "total_steps": 134280, "loss": 0.6494, "lr": 2.2430741733690795e-05, "epoch": 0.8973786118558237, "percentage": 4.49, "elapsed_time": "0:23:12", "remaining_time": "8:14:06", "throughput": 2511.34, "total_tokens": 3497504} +{"current_steps": 6030, "total_steps": 134280, "loss": 0.5968, "lr": 2.2449359547214777e-05, "epoch": 0.8981233243967829, "percentage": 4.49, "elapsed_time": "0:23:13", "remaining_time": "8:14:05", "throughput": 2511.34, "total_tokens": 3500416} +{"current_steps": 6035, "total_steps": 134280, "loss": 0.829, "lr": 2.246797736073876e-05, "epoch": 0.898868036937742, "percentage": 4.49, "elapsed_time": "0:23:14", "remaining_time": "8:14:03", "throughput": 2511.29, "total_tokens": 3503168} +{"current_steps": 6040, "total_steps": 134280, "loss": 0.7809, "lr": 2.2486595174262737e-05, "epoch": 0.8996127494787012, "percentage": 4.5, "elapsed_time": "0:23:16", "remaining_time": "8:14:02", "throughput": 2511.27, "total_tokens": 3506080} +{"current_steps": 6045, "total_steps": 134280, "loss": 0.7254, "lr": 2.2505212987786715e-05, "epoch": 0.9003574620196604, "percentage": 4.5, "elapsed_time": "0:23:17", "remaining_time": "8:14:02", "throughput": 2511.35, "total_tokens": 3509216} +{"current_steps": 6050, "total_steps": 134280, "loss": 0.7901, "lr": 2.2523830801310693e-05, "epoch": 0.9011021745606196, "percentage": 4.51, "elapsed_time": "0:23:18", "remaining_time": "8:14:00", "throughput": 2511.38, "total_tokens": 3512064} +{"current_steps": 6055, "total_steps": 134280, "loss": 0.6813, "lr": 2.2542448614834675e-05, "epoch": 0.9018468871015788, "percentage": 4.51, "elapsed_time": "0:23:19", "remaining_time": "8:13:58", "throughput": 2511.34, "total_tokens": 3514784} +{"current_steps": 6060, "total_steps": 134280, "loss": 0.631, "lr": 2.2561066428358653e-05, "epoch": 0.902591599642538, "percentage": 4.51, "elapsed_time": "0:23:20", "remaining_time": "8:13:59", "throughput": 2511.37, "total_tokens": 3518048} +{"current_steps": 6065, "total_steps": 134280, "loss": 0.6258, "lr": 2.2579684241882634e-05, "epoch": 0.9033363121834972, "percentage": 4.52, "elapsed_time": "0:23:22", "remaining_time": "8:13:59", "throughput": 2511.43, "total_tokens": 3521184} +{"current_steps": 6070, "total_steps": 134280, "loss": 0.6255, "lr": 2.2598302055406613e-05, "epoch": 0.9040810247244564, "percentage": 4.52, "elapsed_time": "0:23:23", "remaining_time": "8:13:59", "throughput": 2511.49, "total_tokens": 3524224} +{"current_steps": 6075, "total_steps": 134280, "loss": 0.6915, "lr": 2.2616919868930594e-05, "epoch": 0.9048257372654156, "percentage": 4.52, "elapsed_time": "0:23:24", "remaining_time": "8:13:57", "throughput": 2511.51, "total_tokens": 3527104} +{"current_steps": 6080, "total_steps": 134280, "loss": 0.589, "lr": 2.2635537682454576e-05, "epoch": 0.9055704498063747, "percentage": 4.53, "elapsed_time": "0:23:25", "remaining_time": "8:13:55", "throughput": 2511.48, "total_tokens": 3529824} +{"current_steps": 6085, "total_steps": 134280, "loss": 0.7859, "lr": 2.2654155495978554e-05, "epoch": 0.9063151623473339, "percentage": 4.53, "elapsed_time": "0:23:26", "remaining_time": "8:13:54", "throughput": 2511.49, "total_tokens": 3532768} +{"current_steps": 6090, "total_steps": 134280, "loss": 0.6025, "lr": 2.2672773309502532e-05, "epoch": 0.9070598748882931, "percentage": 4.54, "elapsed_time": "0:23:27", "remaining_time": "8:13:52", "throughput": 2511.45, "total_tokens": 3535552} +{"current_steps": 6095, "total_steps": 134280, "loss": 0.6901, "lr": 2.269139112302651e-05, "epoch": 0.9078045874292523, "percentage": 4.54, "elapsed_time": "0:23:28", "remaining_time": "8:13:50", "throughput": 2511.43, "total_tokens": 3538336} +{"current_steps": 6100, "total_steps": 134280, "loss": 0.8423, "lr": 2.2710008936550492e-05, "epoch": 0.9085492999702115, "percentage": 4.54, "elapsed_time": "0:23:29", "remaining_time": "8:13:47", "throughput": 2511.35, "total_tokens": 3540928} +{"current_steps": 6105, "total_steps": 134280, "loss": 0.634, "lr": 2.272862675007447e-05, "epoch": 0.9092940125111707, "percentage": 4.55, "elapsed_time": "0:23:31", "remaining_time": "8:13:48", "throughput": 2511.35, "total_tokens": 3544000} +{"current_steps": 6110, "total_steps": 134280, "loss": 0.8218, "lr": 2.2747244563598452e-05, "epoch": 0.9100387250521299, "percentage": 4.55, "elapsed_time": "0:23:32", "remaining_time": "8:13:46", "throughput": 2511.32, "total_tokens": 3546784} +{"current_steps": 6115, "total_steps": 134280, "loss": 0.6011, "lr": 2.2765862377122434e-05, "epoch": 0.9107834375930891, "percentage": 4.55, "elapsed_time": "0:23:33", "remaining_time": "8:13:45", "throughput": 2511.3, "total_tokens": 3549696} +{"current_steps": 6120, "total_steps": 134280, "loss": 0.5222, "lr": 2.2784480190646412e-05, "epoch": 0.9115281501340483, "percentage": 4.56, "elapsed_time": "0:23:34", "remaining_time": "8:13:43", "throughput": 2511.25, "total_tokens": 3552480} +{"current_steps": 6125, "total_steps": 134280, "loss": 0.5456, "lr": 2.2803098004170394e-05, "epoch": 0.9122728626750074, "percentage": 4.56, "elapsed_time": "0:23:35", "remaining_time": "8:13:42", "throughput": 2511.27, "total_tokens": 3555360} +{"current_steps": 6130, "total_steps": 134280, "loss": 0.6588, "lr": 2.2821715817694372e-05, "epoch": 0.9130175752159666, "percentage": 4.57, "elapsed_time": "0:23:36", "remaining_time": "8:13:42", "throughput": 2511.35, "total_tokens": 3558528} +{"current_steps": 6135, "total_steps": 134280, "loss": 0.6591, "lr": 2.284033363121835e-05, "epoch": 0.9137622877569258, "percentage": 4.57, "elapsed_time": "0:23:38", "remaining_time": "8:13:40", "throughput": 2511.33, "total_tokens": 3561280} +{"current_steps": 6140, "total_steps": 134280, "loss": 0.4799, "lr": 2.2858951444742328e-05, "epoch": 0.914507000297885, "percentage": 4.57, "elapsed_time": "0:23:39", "remaining_time": "8:13:41", "throughput": 2511.39, "total_tokens": 3564544} +{"current_steps": 6145, "total_steps": 134280, "loss": 0.7415, "lr": 2.287756925826631e-05, "epoch": 0.9152517128388442, "percentage": 4.58, "elapsed_time": "0:23:40", "remaining_time": "8:13:38", "throughput": 2511.31, "total_tokens": 3567104} +{"current_steps": 6150, "total_steps": 134280, "loss": 0.5169, "lr": 2.289618707179029e-05, "epoch": 0.9159964253798034, "percentage": 4.58, "elapsed_time": "0:23:41", "remaining_time": "8:13:37", "throughput": 2511.38, "total_tokens": 3570080} +{"current_steps": 6155, "total_steps": 134280, "loss": 0.6865, "lr": 2.291480488531427e-05, "epoch": 0.9167411379207626, "percentage": 4.58, "elapsed_time": "0:23:42", "remaining_time": "8:13:36", "throughput": 2511.41, "total_tokens": 3573056} +{"current_steps": 6160, "total_steps": 134280, "loss": 0.7117, "lr": 2.293342269883825e-05, "epoch": 0.9174858504617218, "percentage": 4.59, "elapsed_time": "0:23:43", "remaining_time": "8:13:35", "throughput": 2511.42, "total_tokens": 3576064} +{"current_steps": 6165, "total_steps": 134280, "loss": 0.7159, "lr": 2.295204051236223e-05, "epoch": 0.9182305630026809, "percentage": 4.59, "elapsed_time": "0:23:45", "remaining_time": "8:13:34", "throughput": 2511.48, "total_tokens": 3579040} +{"current_steps": 6170, "total_steps": 134280, "loss": 0.5716, "lr": 2.297065832588621e-05, "epoch": 0.9189752755436401, "percentage": 4.59, "elapsed_time": "0:23:46", "remaining_time": "8:13:33", "throughput": 2511.51, "total_tokens": 3581984} +{"current_steps": 6175, "total_steps": 134280, "loss": 0.6916, "lr": 2.2989276139410186e-05, "epoch": 0.9197199880845993, "percentage": 4.6, "elapsed_time": "0:23:47", "remaining_time": "8:13:32", "throughput": 2511.56, "total_tokens": 3584960} +{"current_steps": 6180, "total_steps": 134280, "loss": 0.6725, "lr": 2.3007893952934168e-05, "epoch": 0.9204647006255585, "percentage": 4.6, "elapsed_time": "0:23:48", "remaining_time": "8:13:30", "throughput": 2511.53, "total_tokens": 3587808} +{"current_steps": 6185, "total_steps": 134280, "loss": 0.6135, "lr": 2.3026511766458146e-05, "epoch": 0.9212094131665177, "percentage": 4.61, "elapsed_time": "0:23:49", "remaining_time": "8:13:29", "throughput": 2511.49, "total_tokens": 3590656} +{"current_steps": 6190, "total_steps": 134280, "loss": 0.8301, "lr": 2.3045129579982128e-05, "epoch": 0.9219541257074769, "percentage": 4.61, "elapsed_time": "0:23:50", "remaining_time": "8:13:26", "throughput": 2511.43, "total_tokens": 3593248} +{"current_steps": 6195, "total_steps": 134280, "loss": 0.5812, "lr": 2.306374739350611e-05, "epoch": 0.9226988382484361, "percentage": 4.61, "elapsed_time": "0:23:51", "remaining_time": "8:13:26", "throughput": 2511.41, "total_tokens": 3596192} +{"current_steps": 6200, "total_steps": 134280, "loss": 0.7691, "lr": 2.3082365207030087e-05, "epoch": 0.9234435507893953, "percentage": 4.62, "elapsed_time": "0:23:53", "remaining_time": "8:13:26", "throughput": 2511.44, "total_tokens": 3599264} +{"current_steps": 6205, "total_steps": 134280, "loss": 0.5998, "lr": 2.310098302055407e-05, "epoch": 0.9241882633303545, "percentage": 4.62, "elapsed_time": "0:23:54", "remaining_time": "8:13:26", "throughput": 2511.43, "total_tokens": 3602304} +{"current_steps": 6210, "total_steps": 134280, "loss": 0.605, "lr": 2.3119600834078047e-05, "epoch": 0.9249329758713136, "percentage": 4.62, "elapsed_time": "0:23:55", "remaining_time": "8:13:24", "throughput": 2511.39, "total_tokens": 3605056} +{"current_steps": 6215, "total_steps": 134280, "loss": 0.5642, "lr": 2.313821864760203e-05, "epoch": 0.9256776884122728, "percentage": 4.63, "elapsed_time": "0:23:56", "remaining_time": "8:13:22", "throughput": 2511.42, "total_tokens": 3607904} +{"current_steps": 6220, "total_steps": 134280, "loss": 0.7669, "lr": 2.3156836461126004e-05, "epoch": 0.926422400953232, "percentage": 4.63, "elapsed_time": "0:23:57", "remaining_time": "8:13:22", "throughput": 2511.48, "total_tokens": 3611008} +{"current_steps": 6225, "total_steps": 134280, "loss": 0.8955, "lr": 2.3175454274649985e-05, "epoch": 0.9271671134941912, "percentage": 4.64, "elapsed_time": "0:23:58", "remaining_time": "8:13:20", "throughput": 2511.5, "total_tokens": 3613920} +{"current_steps": 6230, "total_steps": 134280, "loss": 0.5576, "lr": 2.3194072088173967e-05, "epoch": 0.9279118260351504, "percentage": 4.64, "elapsed_time": "0:24:00", "remaining_time": "8:13:18", "throughput": 2511.45, "total_tokens": 3616608} +{"current_steps": 6235, "total_steps": 134280, "loss": 0.6201, "lr": 2.3212689901697945e-05, "epoch": 0.9286565385761096, "percentage": 4.64, "elapsed_time": "0:24:01", "remaining_time": "8:13:18", "throughput": 2511.53, "total_tokens": 3619776} +{"current_steps": 6240, "total_steps": 134280, "loss": 0.6388, "lr": 2.3231307715221927e-05, "epoch": 0.9294012511170688, "percentage": 4.65, "elapsed_time": "0:24:02", "remaining_time": "8:13:16", "throughput": 2511.56, "total_tokens": 3622624} +{"current_steps": 6245, "total_steps": 134280, "loss": 0.477, "lr": 2.3249925528745905e-05, "epoch": 0.930145963658028, "percentage": 4.65, "elapsed_time": "0:24:03", "remaining_time": "8:13:15", "throughput": 2511.57, "total_tokens": 3625536} +{"current_steps": 6250, "total_steps": 134280, "loss": 0.6527, "lr": 2.3268543342269887e-05, "epoch": 0.9308906761989872, "percentage": 4.65, "elapsed_time": "0:24:04", "remaining_time": "8:13:13", "throughput": 2511.56, "total_tokens": 3628288} +{"current_steps": 6255, "total_steps": 134280, "loss": 0.7162, "lr": 2.3287161155793865e-05, "epoch": 0.9316353887399463, "percentage": 4.66, "elapsed_time": "0:24:05", "remaining_time": "8:13:11", "throughput": 2511.57, "total_tokens": 3631200} +{"current_steps": 6260, "total_steps": 134280, "loss": 0.7502, "lr": 2.3305778969317847e-05, "epoch": 0.9323801012809055, "percentage": 4.66, "elapsed_time": "0:24:06", "remaining_time": "8:13:10", "throughput": 2511.6, "total_tokens": 3634144} +{"current_steps": 6265, "total_steps": 134280, "loss": 0.6446, "lr": 2.332439678284182e-05, "epoch": 0.9331248138218647, "percentage": 4.67, "elapsed_time": "0:24:08", "remaining_time": "8:13:09", "throughput": 2511.58, "total_tokens": 3637024} +{"current_steps": 6270, "total_steps": 134280, "loss": 0.8359, "lr": 2.3343014596365803e-05, "epoch": 0.9338695263628239, "percentage": 4.67, "elapsed_time": "0:24:09", "remaining_time": "8:13:09", "throughput": 2511.57, "total_tokens": 3640000} +{"current_steps": 6275, "total_steps": 134280, "loss": 0.8468, "lr": 2.3361632409889785e-05, "epoch": 0.9346142389037831, "percentage": 4.67, "elapsed_time": "0:24:10", "remaining_time": "8:13:09", "throughput": 2511.61, "total_tokens": 3643168} +{"current_steps": 6280, "total_steps": 134280, "loss": 0.5435, "lr": 2.3380250223413763e-05, "epoch": 0.9353589514447423, "percentage": 4.68, "elapsed_time": "0:24:11", "remaining_time": "8:13:07", "throughput": 2511.55, "total_tokens": 3645856} +{"current_steps": 6285, "total_steps": 134280, "loss": 0.7711, "lr": 2.3398868036937744e-05, "epoch": 0.9361036639857016, "percentage": 4.68, "elapsed_time": "0:24:12", "remaining_time": "8:13:04", "throughput": 2511.5, "total_tokens": 3648480} +{"current_steps": 6290, "total_steps": 134280, "loss": 0.6367, "lr": 2.3417485850461723e-05, "epoch": 0.9368483765266608, "percentage": 4.68, "elapsed_time": "0:24:13", "remaining_time": "8:13:02", "throughput": 2511.45, "total_tokens": 3651168} +{"current_steps": 6295, "total_steps": 134280, "loss": 0.6985, "lr": 2.3436103663985704e-05, "epoch": 0.9375930890676198, "percentage": 4.69, "elapsed_time": "0:24:14", "remaining_time": "8:13:00", "throughput": 2511.52, "total_tokens": 3654144} +{"current_steps": 6300, "total_steps": 134280, "loss": 0.8477, "lr": 2.3454721477509683e-05, "epoch": 0.938337801608579, "percentage": 4.69, "elapsed_time": "0:24:16", "remaining_time": "8:12:59", "throughput": 2511.51, "total_tokens": 3657056} +{"current_steps": 6305, "total_steps": 134280, "loss": 0.6986, "lr": 2.347333929103366e-05, "epoch": 0.9390825141495382, "percentage": 4.7, "elapsed_time": "0:24:17", "remaining_time": "8:13:00", "throughput": 2511.55, "total_tokens": 3660192} +{"current_steps": 6310, "total_steps": 134280, "loss": 0.5991, "lr": 2.3491957104557642e-05, "epoch": 0.9398272266904975, "percentage": 4.7, "elapsed_time": "0:24:18", "remaining_time": "8:12:58", "throughput": 2511.57, "total_tokens": 3663008} +{"current_steps": 6315, "total_steps": 134280, "loss": 0.7087, "lr": 2.351057491808162e-05, "epoch": 0.9405719392314567, "percentage": 4.7, "elapsed_time": "0:24:19", "remaining_time": "8:12:56", "throughput": 2511.63, "total_tokens": 3665984} +{"current_steps": 6320, "total_steps": 134280, "loss": 0.8, "lr": 2.3529192731605602e-05, "epoch": 0.9413166517724159, "percentage": 4.71, "elapsed_time": "0:24:20", "remaining_time": "8:12:55", "throughput": 2511.66, "total_tokens": 3668896} +{"current_steps": 6325, "total_steps": 134280, "loss": 0.6294, "lr": 2.354781054512958e-05, "epoch": 0.9420613643133751, "percentage": 4.71, "elapsed_time": "0:24:21", "remaining_time": "8:12:53", "throughput": 2511.59, "total_tokens": 3671552} +{"current_steps": 6330, "total_steps": 134280, "loss": 0.7029, "lr": 2.3566428358653562e-05, "epoch": 0.9428060768543343, "percentage": 4.71, "elapsed_time": "0:24:23", "remaining_time": "8:12:52", "throughput": 2511.62, "total_tokens": 3674528} +{"current_steps": 6335, "total_steps": 134280, "loss": 0.7643, "lr": 2.358504617217754e-05, "epoch": 0.9435507893952935, "percentage": 4.72, "elapsed_time": "0:24:24", "remaining_time": "8:12:50", "throughput": 2511.53, "total_tokens": 3677184} +{"current_steps": 6340, "total_steps": 134280, "loss": 0.7008, "lr": 2.3603663985701522e-05, "epoch": 0.9442955019362526, "percentage": 4.72, "elapsed_time": "0:24:25", "remaining_time": "8:12:47", "throughput": 2511.45, "total_tokens": 3679744} +{"current_steps": 6345, "total_steps": 134280, "loss": 0.8038, "lr": 2.36222817992255e-05, "epoch": 0.9450402144772118, "percentage": 4.73, "elapsed_time": "0:24:26", "remaining_time": "8:12:45", "throughput": 2511.45, "total_tokens": 3682624} +{"current_steps": 6350, "total_steps": 134280, "loss": 0.6717, "lr": 2.364089961274948e-05, "epoch": 0.945784927018171, "percentage": 4.73, "elapsed_time": "0:24:27", "remaining_time": "8:12:46", "throughput": 2511.59, "total_tokens": 3685984} +{"current_steps": 6355, "total_steps": 134280, "loss": 0.6199, "lr": 2.365951742627346e-05, "epoch": 0.9465296395591302, "percentage": 4.73, "elapsed_time": "0:24:28", "remaining_time": "8:12:45", "throughput": 2511.58, "total_tokens": 3688800} +{"current_steps": 6360, "total_steps": 134280, "loss": 0.7394, "lr": 2.3678135239797438e-05, "epoch": 0.9472743521000894, "percentage": 4.74, "elapsed_time": "0:24:29", "remaining_time": "8:12:44", "throughput": 2511.61, "total_tokens": 3691840} +{"current_steps": 6365, "total_steps": 134280, "loss": 0.5234, "lr": 2.369675305332142e-05, "epoch": 0.9480190646410486, "percentage": 4.74, "elapsed_time": "0:24:31", "remaining_time": "8:12:42", "throughput": 2511.66, "total_tokens": 3694720} +{"current_steps": 6370, "total_steps": 134280, "loss": 0.719, "lr": 2.3715370866845398e-05, "epoch": 0.9487637771820078, "percentage": 4.74, "elapsed_time": "0:24:32", "remaining_time": "8:12:41", "throughput": 2511.65, "total_tokens": 3697568} +{"current_steps": 6375, "total_steps": 134280, "loss": 0.6655, "lr": 2.373398868036938e-05, "epoch": 0.949508489722967, "percentage": 4.75, "elapsed_time": "0:24:33", "remaining_time": "8:12:39", "throughput": 2511.64, "total_tokens": 3700416} +{"current_steps": 6380, "total_steps": 134280, "loss": 0.6658, "lr": 2.3752606493893358e-05, "epoch": 0.9502532022639262, "percentage": 4.75, "elapsed_time": "0:24:34", "remaining_time": "8:12:38", "throughput": 2511.71, "total_tokens": 3703456} +{"current_steps": 6385, "total_steps": 134280, "loss": 0.5945, "lr": 2.377122430741734e-05, "epoch": 0.9509979148048853, "percentage": 4.75, "elapsed_time": "0:24:35", "remaining_time": "8:12:35", "throughput": 2511.67, "total_tokens": 3706048} +{"current_steps": 6390, "total_steps": 134280, "loss": 0.6587, "lr": 2.3789842120941318e-05, "epoch": 0.9517426273458445, "percentage": 4.76, "elapsed_time": "0:24:36", "remaining_time": "8:12:33", "throughput": 2511.65, "total_tokens": 3708736} +{"current_steps": 6395, "total_steps": 134280, "loss": 0.4081, "lr": 2.3808459934465296e-05, "epoch": 0.9524873398868037, "percentage": 4.76, "elapsed_time": "0:24:37", "remaining_time": "8:12:30", "throughput": 2511.59, "total_tokens": 3711392} +{"current_steps": 6400, "total_steps": 134280, "loss": 0.7961, "lr": 2.3827077747989278e-05, "epoch": 0.9532320524277629, "percentage": 4.77, "elapsed_time": "0:24:38", "remaining_time": "8:12:29", "throughput": 2511.59, "total_tokens": 3714304} +{"current_steps": 6405, "total_steps": 134280, "loss": 0.6045, "lr": 2.3845695561513256e-05, "epoch": 0.9539767649687221, "percentage": 4.77, "elapsed_time": "0:24:39", "remaining_time": "8:12:27", "throughput": 2511.61, "total_tokens": 3717120} +{"current_steps": 6410, "total_steps": 134280, "loss": 0.7087, "lr": 2.3864313375037238e-05, "epoch": 0.9547214775096813, "percentage": 4.77, "elapsed_time": "0:24:41", "remaining_time": "8:12:24", "throughput": 2511.51, "total_tokens": 3719648} +{"current_steps": 6415, "total_steps": 134280, "loss": 0.7117, "lr": 2.3882931188561216e-05, "epoch": 0.9554661900506405, "percentage": 4.78, "elapsed_time": "0:24:42", "remaining_time": "8:12:24", "throughput": 2511.53, "total_tokens": 3722688} +{"current_steps": 6420, "total_steps": 134280, "loss": 0.7494, "lr": 2.3901549002085197e-05, "epoch": 0.9562109025915997, "percentage": 4.78, "elapsed_time": "0:24:43", "remaining_time": "8:12:22", "throughput": 2511.49, "total_tokens": 3725440} +{"current_steps": 6425, "total_steps": 134280, "loss": 0.4408, "lr": 2.3920166815609176e-05, "epoch": 0.9569556151325588, "percentage": 4.78, "elapsed_time": "0:24:44", "remaining_time": "8:12:20", "throughput": 2511.51, "total_tokens": 3728320} +{"current_steps": 6430, "total_steps": 134280, "loss": 0.5902, "lr": 2.3938784629133157e-05, "epoch": 0.957700327673518, "percentage": 4.79, "elapsed_time": "0:24:45", "remaining_time": "8:12:20", "throughput": 2511.56, "total_tokens": 3731360} +{"current_steps": 6435, "total_steps": 134280, "loss": 0.6218, "lr": 2.3957402442657135e-05, "epoch": 0.9584450402144772, "percentage": 4.79, "elapsed_time": "0:24:46", "remaining_time": "8:12:17", "throughput": 2511.51, "total_tokens": 3733984} +{"current_steps": 6440, "total_steps": 134280, "loss": 0.6003, "lr": 2.3976020256181114e-05, "epoch": 0.9591897527554364, "percentage": 4.8, "elapsed_time": "0:24:47", "remaining_time": "8:12:15", "throughput": 2511.53, "total_tokens": 3736832} +{"current_steps": 6445, "total_steps": 134280, "loss": 0.7569, "lr": 2.3994638069705095e-05, "epoch": 0.9599344652963956, "percentage": 4.8, "elapsed_time": "0:24:49", "remaining_time": "8:12:14", "throughput": 2511.56, "total_tokens": 3739808} +{"current_steps": 6450, "total_steps": 134280, "loss": 0.5495, "lr": 2.4013255883229074e-05, "epoch": 0.9606791778373548, "percentage": 4.8, "elapsed_time": "0:24:50", "remaining_time": "8:12:14", "throughput": 2511.56, "total_tokens": 3742816} +{"current_steps": 6455, "total_steps": 134280, "loss": 0.6241, "lr": 2.4031873696753055e-05, "epoch": 0.961423890378314, "percentage": 4.81, "elapsed_time": "0:24:51", "remaining_time": "8:12:13", "throughput": 2511.59, "total_tokens": 3745760} +{"current_steps": 6460, "total_steps": 134280, "loss": 0.7599, "lr": 2.4050491510277033e-05, "epoch": 0.9621686029192732, "percentage": 4.81, "elapsed_time": "0:24:52", "remaining_time": "8:12:11", "throughput": 2511.57, "total_tokens": 3748512} +{"current_steps": 6465, "total_steps": 134280, "loss": 0.7327, "lr": 2.4069109323801015e-05, "epoch": 0.9629133154602324, "percentage": 4.81, "elapsed_time": "0:24:53", "remaining_time": "8:12:10", "throughput": 2511.61, "total_tokens": 3751520} +{"current_steps": 6470, "total_steps": 134280, "loss": 0.8244, "lr": 2.4087727137324993e-05, "epoch": 0.9636580280011915, "percentage": 4.82, "elapsed_time": "0:24:54", "remaining_time": "8:12:08", "throughput": 2511.62, "total_tokens": 3754368} +{"current_steps": 6475, "total_steps": 134280, "loss": 0.6815, "lr": 2.4106344950848975e-05, "epoch": 0.9644027405421507, "percentage": 4.82, "elapsed_time": "0:24:56", "remaining_time": "8:12:09", "throughput": 2511.67, "total_tokens": 3757536} +{"current_steps": 6480, "total_steps": 134280, "loss": 0.572, "lr": 2.4124962764372953e-05, "epoch": 0.9651474530831099, "percentage": 4.83, "elapsed_time": "0:24:57", "remaining_time": "8:12:10", "throughput": 2511.71, "total_tokens": 3760768} +{"current_steps": 6485, "total_steps": 134280, "loss": 0.4967, "lr": 2.414358057789693e-05, "epoch": 0.9658921656240691, "percentage": 4.83, "elapsed_time": "0:24:58", "remaining_time": "8:12:08", "throughput": 2511.71, "total_tokens": 3763584} +{"current_steps": 6490, "total_steps": 134280, "loss": 0.6973, "lr": 2.4162198391420913e-05, "epoch": 0.9666368781650283, "percentage": 4.83, "elapsed_time": "0:24:59", "remaining_time": "8:12:07", "throughput": 2511.73, "total_tokens": 3766560} +{"current_steps": 6495, "total_steps": 134280, "loss": 0.5085, "lr": 2.418081620494489e-05, "epoch": 0.9673815907059875, "percentage": 4.84, "elapsed_time": "0:25:00", "remaining_time": "8:12:08", "throughput": 2511.84, "total_tokens": 3769920} +{"current_steps": 6500, "total_steps": 134280, "loss": 0.5819, "lr": 2.4199434018468873e-05, "epoch": 0.9681263032469467, "percentage": 4.84, "elapsed_time": "0:25:02", "remaining_time": "8:12:07", "throughput": 2511.82, "total_tokens": 3772800} +{"current_steps": 6505, "total_steps": 134280, "loss": 0.5953, "lr": 2.421805183199285e-05, "epoch": 0.9688710157879059, "percentage": 4.84, "elapsed_time": "0:25:03", "remaining_time": "8:12:06", "throughput": 2511.84, "total_tokens": 3775712} +{"current_steps": 6510, "total_steps": 134280, "loss": 0.5862, "lr": 2.4236669645516833e-05, "epoch": 0.9696157283288651, "percentage": 4.85, "elapsed_time": "0:25:04", "remaining_time": "8:12:04", "throughput": 2511.81, "total_tokens": 3778496} +{"current_steps": 6515, "total_steps": 134280, "loss": 0.6335, "lr": 2.425528745904081e-05, "epoch": 0.9703604408698242, "percentage": 4.85, "elapsed_time": "0:25:05", "remaining_time": "8:12:05", "throughput": 2511.82, "total_tokens": 3781664} +{"current_steps": 6520, "total_steps": 134280, "loss": 0.888, "lr": 2.4273905272564793e-05, "epoch": 0.9711051534107834, "percentage": 4.86, "elapsed_time": "0:25:06", "remaining_time": "8:12:02", "throughput": 2511.83, "total_tokens": 3784416} +{"current_steps": 6525, "total_steps": 134280, "loss": 0.6984, "lr": 2.429252308608877e-05, "epoch": 0.9718498659517426, "percentage": 4.86, "elapsed_time": "0:25:07", "remaining_time": "8:12:00", "throughput": 2511.82, "total_tokens": 3787168} +{"current_steps": 6530, "total_steps": 134280, "loss": 0.6532, "lr": 2.431114089961275e-05, "epoch": 0.9725945784927018, "percentage": 4.86, "elapsed_time": "0:25:08", "remaining_time": "8:11:59", "throughput": 2511.86, "total_tokens": 3790144} +{"current_steps": 6535, "total_steps": 134280, "loss": 0.6717, "lr": 2.432975871313673e-05, "epoch": 0.973339291033661, "percentage": 4.87, "elapsed_time": "0:25:10", "remaining_time": "8:11:57", "throughput": 2511.85, "total_tokens": 3792992} +{"current_steps": 6540, "total_steps": 134280, "loss": 0.8229, "lr": 2.434837652666071e-05, "epoch": 0.9740840035746202, "percentage": 4.87, "elapsed_time": "0:25:11", "remaining_time": "8:11:56", "throughput": 2511.86, "total_tokens": 3795840} +{"current_steps": 6545, "total_steps": 134280, "loss": 0.7582, "lr": 2.436699434018469e-05, "epoch": 0.9748287161155794, "percentage": 4.87, "elapsed_time": "0:25:12", "remaining_time": "8:11:53", "throughput": 2511.78, "total_tokens": 3798464} +{"current_steps": 6550, "total_steps": 134280, "loss": 0.6376, "lr": 2.438561215370867e-05, "epoch": 0.9755734286565386, "percentage": 4.88, "elapsed_time": "0:25:13", "remaining_time": "8:11:53", "throughput": 2511.78, "total_tokens": 3801472} +{"current_steps": 6555, "total_steps": 134280, "loss": 0.5809, "lr": 2.440422996723265e-05, "epoch": 0.9763181411974977, "percentage": 4.88, "elapsed_time": "0:25:14", "remaining_time": "8:11:52", "throughput": 2511.77, "total_tokens": 3804320} +{"current_steps": 6560, "total_steps": 134280, "loss": 0.6798, "lr": 2.4422847780756632e-05, "epoch": 0.9770628537384569, "percentage": 4.89, "elapsed_time": "0:25:15", "remaining_time": "8:11:49", "throughput": 2511.75, "total_tokens": 3807072} +{"current_steps": 6565, "total_steps": 134280, "loss": 0.7352, "lr": 2.4441465594280607e-05, "epoch": 0.9778075662794161, "percentage": 4.89, "elapsed_time": "0:25:16", "remaining_time": "8:11:49", "throughput": 2511.71, "total_tokens": 3809984} +{"current_steps": 6570, "total_steps": 134280, "loss": 0.6725, "lr": 2.446008340780459e-05, "epoch": 0.9785522788203753, "percentage": 4.89, "elapsed_time": "0:25:18", "remaining_time": "8:11:49", "throughput": 2511.74, "total_tokens": 3813024} +{"current_steps": 6575, "total_steps": 134280, "loss": 0.6835, "lr": 2.4478701221328567e-05, "epoch": 0.9792969913613345, "percentage": 4.9, "elapsed_time": "0:25:19", "remaining_time": "8:11:46", "throughput": 2511.66, "total_tokens": 3815584} +{"current_steps": 6580, "total_steps": 134280, "loss": 0.5737, "lr": 2.4497319034852548e-05, "epoch": 0.9800417039022937, "percentage": 4.9, "elapsed_time": "0:25:20", "remaining_time": "8:11:43", "throughput": 2511.64, "total_tokens": 3818272} +{"current_steps": 6585, "total_steps": 134280, "loss": 0.4754, "lr": 2.4515936848376527e-05, "epoch": 0.9807864164432529, "percentage": 4.9, "elapsed_time": "0:25:21", "remaining_time": "8:11:42", "throughput": 2511.57, "total_tokens": 3821088} +{"current_steps": 6590, "total_steps": 134280, "loss": 0.6228, "lr": 2.4534554661900508e-05, "epoch": 0.9815311289842121, "percentage": 4.91, "elapsed_time": "0:25:22", "remaining_time": "8:11:40", "throughput": 2511.55, "total_tokens": 3823872} +{"current_steps": 6595, "total_steps": 134280, "loss": 0.6073, "lr": 2.4553172475424486e-05, "epoch": 0.9822758415251713, "percentage": 4.91, "elapsed_time": "0:25:23", "remaining_time": "8:11:39", "throughput": 2511.54, "total_tokens": 3826752} +{"current_steps": 6600, "total_steps": 134280, "loss": 0.6688, "lr": 2.4571790288948468e-05, "epoch": 0.9830205540661304, "percentage": 4.92, "elapsed_time": "0:25:24", "remaining_time": "8:11:37", "throughput": 2511.53, "total_tokens": 3829504} +{"current_steps": 6605, "total_steps": 134280, "loss": 0.5275, "lr": 2.459040810247245e-05, "epoch": 0.9837652666070896, "percentage": 4.92, "elapsed_time": "0:25:25", "remaining_time": "8:11:36", "throughput": 2511.54, "total_tokens": 3832448} +{"current_steps": 6610, "total_steps": 134280, "loss": 0.6701, "lr": 2.4609025915996424e-05, "epoch": 0.9845099791480488, "percentage": 4.92, "elapsed_time": "0:25:27", "remaining_time": "8:11:35", "throughput": 2511.59, "total_tokens": 3835456} +{"current_steps": 6615, "total_steps": 134280, "loss": 0.6198, "lr": 2.4627643729520406e-05, "epoch": 0.985254691689008, "percentage": 4.93, "elapsed_time": "0:25:28", "remaining_time": "8:11:34", "throughput": 2511.67, "total_tokens": 3838560} +{"current_steps": 6620, "total_steps": 134280, "loss": 0.7882, "lr": 2.4646261543044384e-05, "epoch": 0.9859994042299672, "percentage": 4.93, "elapsed_time": "0:25:29", "remaining_time": "8:11:33", "throughput": 2511.73, "total_tokens": 3841568} +{"current_steps": 6625, "total_steps": 134280, "loss": 0.7997, "lr": 2.4664879356568366e-05, "epoch": 0.9867441167709264, "percentage": 4.93, "elapsed_time": "0:25:30", "remaining_time": "8:11:32", "throughput": 2511.72, "total_tokens": 3844384} +{"current_steps": 6630, "total_steps": 134280, "loss": 0.6079, "lr": 2.4683497170092344e-05, "epoch": 0.9874888293118856, "percentage": 4.94, "elapsed_time": "0:25:31", "remaining_time": "8:11:33", "throughput": 2511.74, "total_tokens": 3847616} +{"current_steps": 6635, "total_steps": 134280, "loss": 0.7518, "lr": 2.4702114983616326e-05, "epoch": 0.9882335418528448, "percentage": 4.94, "elapsed_time": "0:25:32", "remaining_time": "8:11:31", "throughput": 2511.74, "total_tokens": 3850496} +{"current_steps": 6640, "total_steps": 134280, "loss": 0.6165, "lr": 2.4720732797140307e-05, "epoch": 0.988978254393804, "percentage": 4.94, "elapsed_time": "0:25:34", "remaining_time": "8:11:31", "throughput": 2511.8, "total_tokens": 3853600} +{"current_steps": 6645, "total_steps": 134280, "loss": 0.6925, "lr": 2.4739350610664286e-05, "epoch": 0.9897229669347631, "percentage": 4.95, "elapsed_time": "0:25:35", "remaining_time": "8:11:30", "throughput": 2511.79, "total_tokens": 3856416} +{"current_steps": 6650, "total_steps": 134280, "loss": 0.6268, "lr": 2.4757968424188267e-05, "epoch": 0.9904676794757223, "percentage": 4.95, "elapsed_time": "0:25:36", "remaining_time": "8:11:27", "throughput": 2511.71, "total_tokens": 3858976} +{"current_steps": 6655, "total_steps": 134280, "loss": 0.7361, "lr": 2.4776586237712242e-05, "epoch": 0.9912123920166815, "percentage": 4.96, "elapsed_time": "0:25:37", "remaining_time": "8:11:26", "throughput": 2511.76, "total_tokens": 3861984} +{"current_steps": 6660, "total_steps": 134280, "loss": 0.7769, "lr": 2.4795204051236224e-05, "epoch": 0.9919571045576407, "percentage": 4.96, "elapsed_time": "0:25:38", "remaining_time": "8:11:24", "throughput": 2511.74, "total_tokens": 3864768} +{"current_steps": 6665, "total_steps": 134280, "loss": 0.5893, "lr": 2.4813821864760202e-05, "epoch": 0.9927018170986, "percentage": 4.96, "elapsed_time": "0:25:39", "remaining_time": "8:11:23", "throughput": 2511.75, "total_tokens": 3867680} +{"current_steps": 6670, "total_steps": 134280, "loss": 0.6631, "lr": 2.4832439678284184e-05, "epoch": 0.9934465296395592, "percentage": 4.97, "elapsed_time": "0:25:40", "remaining_time": "8:11:21", "throughput": 2511.77, "total_tokens": 3870560} +{"current_steps": 6675, "total_steps": 134280, "loss": 0.5712, "lr": 2.4851057491808162e-05, "epoch": 0.9941912421805184, "percentage": 4.97, "elapsed_time": "0:25:42", "remaining_time": "8:11:20", "throughput": 2511.77, "total_tokens": 3873408} +{"current_steps": 6680, "total_steps": 134280, "loss": 0.7119, "lr": 2.4869675305332143e-05, "epoch": 0.9949359547214776, "percentage": 4.97, "elapsed_time": "0:25:43", "remaining_time": "8:11:18", "throughput": 2511.81, "total_tokens": 3876320} +{"current_steps": 6685, "total_steps": 134280, "loss": 0.6968, "lr": 2.4888293118856125e-05, "epoch": 0.9956806672624366, "percentage": 4.98, "elapsed_time": "0:25:44", "remaining_time": "8:11:16", "throughput": 2511.75, "total_tokens": 3879008} +{"current_steps": 6690, "total_steps": 134280, "loss": 0.6994, "lr": 2.4906910932380103e-05, "epoch": 0.9964253798033958, "percentage": 4.98, "elapsed_time": "0:25:45", "remaining_time": "8:11:14", "throughput": 2511.71, "total_tokens": 3881760} +{"current_steps": 6695, "total_steps": 134280, "loss": 0.7024, "lr": 2.492552874590408e-05, "epoch": 0.997170092344355, "percentage": 4.99, "elapsed_time": "0:25:46", "remaining_time": "8:11:13", "throughput": 2511.75, "total_tokens": 3884672} +{"current_steps": 6700, "total_steps": 134280, "loss": 0.613, "lr": 2.494414655942806e-05, "epoch": 0.9979148048853143, "percentage": 4.99, "elapsed_time": "0:25:47", "remaining_time": "8:11:10", "throughput": 2511.74, "total_tokens": 3887360} +{"current_steps": 6705, "total_steps": 134280, "loss": 0.6612, "lr": 2.496276437295204e-05, "epoch": 0.9986595174262735, "percentage": 4.99, "elapsed_time": "0:25:48", "remaining_time": "8:11:08", "throughput": 2511.63, "total_tokens": 3889920} +{"current_steps": 6710, "total_steps": 134280, "loss": 0.5315, "lr": 2.498138218647602e-05, "epoch": 0.9994042299672327, "percentage": 5.0, "elapsed_time": "0:25:49", "remaining_time": "8:11:06", "throughput": 2511.61, "total_tokens": 3892704} +{"current_steps": 6714, "total_steps": 134280, "eval_loss": 0.6720787286758423, "epoch": 1.0, "percentage": 5.0, "elapsed_time": "0:26:42", "remaining_time": "8:27:18", "throughput": 2431.03, "total_tokens": 3894552} +{"current_steps": 6715, "total_steps": 134280, "loss": 0.5735, "lr": 2.5e-05, "epoch": 1.0001489425081918, "percentage": 5.0, "elapsed_time": "0:26:43", "remaining_time": "8:27:44", "throughput": 2428.9, "total_tokens": 3895096} +{"current_steps": 6720, "total_steps": 134280, "loss": 0.565, "lr": 2.5018617813523983e-05, "epoch": 1.000893655049151, "percentage": 5.0, "elapsed_time": "0:26:45", "remaining_time": "8:27:51", "throughput": 2428.4, "total_tokens": 3898200} +{"current_steps": 6725, "total_steps": 134280, "loss": 0.5842, "lr": 2.503723562704796e-05, "epoch": 1.0016383675901102, "percentage": 5.01, "elapsed_time": "0:26:46", "remaining_time": "8:27:48", "throughput": 2428.44, "total_tokens": 3900984} +{"current_steps": 6730, "total_steps": 134280, "loss": 0.6241, "lr": 2.5055853440571943e-05, "epoch": 1.0023830801310694, "percentage": 5.01, "elapsed_time": "0:26:47", "remaining_time": "8:27:46", "throughput": 2428.5, "total_tokens": 3903928} +{"current_steps": 6735, "total_steps": 134280, "loss": 0.8063, "lr": 2.507447125409592e-05, "epoch": 1.0031277926720286, "percentage": 5.02, "elapsed_time": "0:26:48", "remaining_time": "8:27:44", "throughput": 2428.61, "total_tokens": 3906840}